print log
Browse files
- app.py +2 -0
- vietTTS/nat/text2mel.py +1 -0
app.py
CHANGED
@@ -19,6 +19,8 @@ def text_to_speech(text):
|
|
19 |
"acoustic_latest_ckpt.pickle",
|
20 |
"duration_latest_ckpt.pickle",
|
21 |
)
|
|
|
|
|
22 |
wave = mel2wave(mel, "config.json", "hk_hifi.pickle")
|
23 |
print("wave")
|
24 |
print(wave)
|
|
|
19 |
"acoustic_latest_ckpt.pickle",
|
20 |
"duration_latest_ckpt.pickle",
|
21 |
)
|
22 |
+
print("mel")
|
23 |
+
print(mel)
|
24 |
wave = mel2wave(mel, "config.json", "hk_hifi.pickle")
|
25 |
print("wave")
|
26 |
print(wave)
|
vietTTS/nat/text2mel.py
CHANGED
@@ -89,6 +89,7 @@ def text2mel(
|
|
89 |
duration_ckpt=FLAGS.ckpt_dir / "duration_latest_ckpt.pickle",
|
90 |
):
|
91 |
tokens = text2tokens(text, lexicon_fn)
|
|
|
92 |
durations = predict_duration(tokens, duration_ckpt)
|
93 |
durations = jnp.where(
|
94 |
np.array(tokens)[None, :] == FLAGS.sil_index,
|
|
|
89 |
duration_ckpt=FLAGS.ckpt_dir / "duration_latest_ckpt.pickle",
|
90 |
):
|
91 |
tokens = text2tokens(text, lexicon_fn)
|
92 |
+
print("text2mel-token : " + tokens)
|
93 |
durations = predict_duration(tokens, duration_ckpt)
|
94 |
durations = jnp.where(
|
95 |
np.array(tokens)[None, :] == FLAGS.sil_index,
|