move data.py and rename some files
This commit is contained in:
parent
c8482a0788
commit
5ad005fd9a
|
@ -132,7 +132,7 @@ dmypy.json
|
||||||
.pyre/
|
.pyre/
|
||||||
|
|
||||||
# Shell, vim, and output folder
|
# Shell, vim, and output folder
|
||||||
*.sh
|
#*.sh
|
||||||
*.swp
|
*.swp
|
||||||
runs
|
runs
|
||||||
syn_audios
|
syn_audios
|
||||||
|
|
|
@ -13,10 +13,12 @@ from tensorboardX import SummaryWriter
|
||||||
import paddle.fluid.dygraph as dg
|
import paddle.fluid.dygraph as dg
|
||||||
import paddle.fluid.layers as layers
|
import paddle.fluid.layers as layers
|
||||||
import paddle.fluid as fluid
|
import paddle.fluid as fluid
|
||||||
from parakeet.models.dataloader.ljspeech import LJSpeechLoader
|
from parakeet.models.transformer_tts.transformer_tts import TransformerTTS
|
||||||
from parakeet.models.transformer_tts.transformerTTS import TransformerTTS
|
|
||||||
from parakeet.models.fastspeech.fastspeech import FastSpeech
|
from parakeet.models.fastspeech.fastspeech import FastSpeech
|
||||||
from parakeet.models.fastspeech.utils import get_alignment
|
from parakeet.models.fastspeech.utils import get_alignment
|
||||||
|
import sys
|
||||||
|
sys.path.append("../transformer_tts")
|
||||||
|
from data import LJSpeechLoader
|
||||||
|
|
||||||
def load_checkpoint(step, model_path):
|
def load_checkpoint(step, model_path):
|
||||||
model_dict, opti_dict = fluid.dygraph.load_dygraph(os.path.join(model_path, step))
|
model_dict, opti_dict = fluid.dygraph.load_dygraph(os.path.join(model_path, step))
|
||||||
|
|
|
@ -1,4 +1,3 @@
|
||||||
|
|
||||||
# train model
|
# train model
|
||||||
# if you wish to resume from an existing model, uncomment --checkpoint_path and --fastspeech_step
|
# if you wish to resume from an existing model, uncomment --checkpoint_path and --fastspeech_step
|
||||||
#CUDA_VISIBLE_DEVICES=0,1,2,3 \
|
#CUDA_VISIBLE_DEVICES=0,1,2,3 \
|
||||||
|
|
|
@ -14,7 +14,7 @@ from pprint import pprint
|
||||||
from collections import OrderedDict
|
from collections import OrderedDict
|
||||||
from parakeet import audio
|
from parakeet import audio
|
||||||
from parakeet.models.transformer_tts.vocoder import Vocoder
|
from parakeet.models.transformer_tts.vocoder import Vocoder
|
||||||
from parakeet.models.transformer_tts.transformerTTS import TransformerTTS
|
from parakeet.models.transformer_tts.transformer_tts import TransformerTTS
|
||||||
|
|
||||||
def load_checkpoint(step, model_path):
|
def load_checkpoint(step, model_path):
|
||||||
model_dict, _ = fluid.dygraph.load_dygraph(os.path.join(model_path, step))
|
model_dict, _ = fluid.dygraph.load_dygraph(os.path.join(model_path, step))
|
||||||
|
|
|
@ -13,8 +13,8 @@ import paddle.fluid as fluid
|
||||||
import paddle.fluid.dygraph as dg
|
import paddle.fluid.dygraph as dg
|
||||||
import paddle.fluid.layers as layers
|
import paddle.fluid.layers as layers
|
||||||
from parakeet.modules.utils import cross_entropy
|
from parakeet.modules.utils import cross_entropy
|
||||||
from parakeet.models.dataloader.ljspeech import LJSpeechLoader
|
from data import LJSpeechLoader
|
||||||
from parakeet.models.transformer_tts.transformerTTS import TransformerTTS
|
from parakeet.models.transformer_tts.transformer_tts import TransformerTTS
|
||||||
|
|
||||||
def load_checkpoint(step, model_path):
|
def load_checkpoint(step, model_path):
|
||||||
model_dict, opti_dict = fluid.dygraph.load_dygraph(os.path.join(model_path, step))
|
model_dict, opti_dict = fluid.dygraph.load_dygraph(os.path.join(model_path, step))
|
||||||
|
|
|
@ -10,7 +10,7 @@ from pprint import pprint
|
||||||
import paddle.fluid as fluid
|
import paddle.fluid as fluid
|
||||||
import paddle.fluid.dygraph as dg
|
import paddle.fluid.dygraph as dg
|
||||||
import paddle.fluid.layers as layers
|
import paddle.fluid.layers as layers
|
||||||
from parakeet.models.dataloader.ljspeech import LJSpeechLoader
|
from data import LJSpeechLoader
|
||||||
from parakeet.models.transformer_tts.vocoder import Vocoder
|
from parakeet.models.transformer_tts.vocoder import Vocoder
|
||||||
|
|
||||||
def load_checkpoint(step, model_path):
|
def load_checkpoint(step, model_path):
|
||||||
|
|
|
@ -1,7 +1,7 @@
|
||||||
import paddle.fluid.dygraph as dg
|
import paddle.fluid.dygraph as dg
|
||||||
import paddle.fluid as fluid
|
import paddle.fluid as fluid
|
||||||
from parakeet.modules.utils import *
|
from parakeet.modules.utils import *
|
||||||
from parakeet.models.fastspeech.FFTBlock import FFTBlock
|
from parakeet.models.fastspeech.fft_block import FFTBlock
|
||||||
|
|
||||||
class Decoder(dg.Layer):
|
class Decoder(dg.Layer):
|
||||||
def __init__(self,
|
def __init__(self,
|
||||||
|
|
|
@ -1,7 +1,7 @@
|
||||||
import paddle.fluid.dygraph as dg
|
import paddle.fluid.dygraph as dg
|
||||||
import paddle.fluid as fluid
|
import paddle.fluid as fluid
|
||||||
from parakeet.modules.utils import *
|
from parakeet.modules.utils import *
|
||||||
from parakeet.models.fastspeech.FFTBlock import FFTBlock
|
from parakeet.models.fastspeech.fft_block import FFTBlock
|
||||||
|
|
||||||
class Encoder(dg.Layer):
|
class Encoder(dg.Layer):
|
||||||
def __init__(self,
|
def __init__(self,
|
||||||
|
|
|
@ -3,7 +3,7 @@ import paddle.fluid.dygraph as dg
|
||||||
import paddle.fluid as fluid
|
import paddle.fluid as fluid
|
||||||
from parakeet.g2p.text.symbols import symbols
|
from parakeet.g2p.text.symbols import symbols
|
||||||
from parakeet.models.transformer_tts.post_convnet import PostConvNet
|
from parakeet.models.transformer_tts.post_convnet import PostConvNet
|
||||||
from parakeet.models.fastspeech.LengthRegulator import LengthRegulator
|
from parakeet.models.fastspeech.length_regulator import LengthRegulator
|
||||||
from parakeet.models.fastspeech.encoder import Encoder
|
from parakeet.models.fastspeech.encoder import Encoder
|
||||||
from parakeet.models.fastspeech.decoder import Decoder
|
from parakeet.models.fastspeech.decoder import Decoder
|
||||||
|
|
||||||
|
|
|
@ -11,16 +11,9 @@ class TransformerTTS(dg.Layer):
|
||||||
self.config = config
|
self.config = config
|
||||||
|
|
||||||
def forward(self, characters, mel_input, pos_text, pos_mel):
|
def forward(self, characters, mel_input, pos_text, pos_mel):
|
||||||
# key (batch_size, seq_len, channel)
|
|
||||||
# c_mask (batch_size, seq_len)
|
|
||||||
# attns_enc (channel / 2, seq_len, seq_len)
|
|
||||||
|
|
||||||
key, c_mask, attns_enc = self.encoder(characters, pos_text)
|
key, c_mask, attns_enc = self.encoder(characters, pos_text)
|
||||||
|
|
||||||
# mel_output/postnet_output (batch_size, mel_len, n_mel)
|
|
||||||
# attn_probs (128, mel_len, seq_len)
|
|
||||||
# stop_preds (batch_size, mel_len, 1)
|
|
||||||
# attns_dec (128, mel_len, mel_len)
|
|
||||||
mel_output, postnet_output, attn_probs, stop_preds, attns_dec = self.decoder(key, key, mel_input, c_mask, pos_mel)
|
mel_output, postnet_output, attn_probs, stop_preds, attns_dec = self.decoder(key, key, mel_input, c_mask, pos_mel)
|
||||||
|
|
||||||
return mel_output, postnet_output, attn_probs, stop_preds, attns_enc, attns_dec
|
return mel_output, postnet_output, attn_probs, stop_preds, attns_enc, attns_dec
|
|
@ -2,7 +2,7 @@ import paddle.fluid.dygraph as dg
|
||||||
import paddle.fluid as fluid
|
import paddle.fluid as fluid
|
||||||
from parakeet.modules.customized import Conv1D
|
from parakeet.modules.customized import Conv1D
|
||||||
from parakeet.modules.utils import *
|
from parakeet.modules.utils import *
|
||||||
from parakeet.models.transformer_tts.CBHG import CBHG
|
from parakeet.models.transformer_tts.cbhg import CBHG
|
||||||
|
|
||||||
class Vocoder(dg.Layer):
|
class Vocoder(dg.Layer):
|
||||||
"""
|
"""
|
||||||
|
|
Loading…
Reference in New Issue