Spaces:
Build error
Build error
Commit
·
ebe9cbe
1
Parent(s):
7d0bff2
Add some more sample voices
Browse files
- .vscode/settings.json +3 -0
- app.py +17 -7
- input/sample/Dwayne-Johnson-sample.wav +3 -0
- input/sample/Elon-Sample.wav +3 -0
- input/sample/Obama-sample.wav +3 -0
- output/output.wav +2 -2
.vscode/settings.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"cSpell.words": ["Elon"]
|
3 |
+
}
|
app.py
CHANGED
@@ -9,7 +9,7 @@ all_models = TTS.list_models()
|
|
9 |
# print(model)
|
10 |
|
11 |
# print("Using model: ", all_models[0])
|
12 |
-
|
13 |
# Init TTS
|
14 |
|
15 |
|
@@ -17,6 +17,8 @@ print("Downloading model...", '')
|
|
17 |
|
18 |
voiceCloneModel = TTS('tts_models/multilingual/multi-dataset/your_tts')
|
19 |
|
|
|
|
|
20 |
|
21 |
def run_cmd(command):
|
22 |
try:
|
@@ -36,27 +38,35 @@ def inference(text, speaker):
|
|
36 |
speaker = 'input/obama.mp3'
|
37 |
elif (speaker == 'Speaker-4'):
|
38 |
speaker = 'input/trump.wav'
|
|
|
|
|
|
|
|
|
|
|
|
|
39 |
else:
|
40 |
speaker = 'input/z-default.wav'
|
41 |
# print("speaker: ", speaker)
|
42 |
# cmd = ['tts', '--text', text, '--out_path', 'output/tts_output.wav']
|
43 |
# run_cmd(cmd)
|
44 |
# Text to speech to a file
|
45 |
-
# tts = TTS(
|
46 |
# progress_bar=False, gpu=True)
|
47 |
voiceCloneModel.tts_to_file(text, speaker_wav=speaker,
|
48 |
language="en", file_path="output/output.wav")
|
49 |
|
50 |
-
# for i in range(len(
|
51 |
-
#
|
52 |
-
#
|
53 |
|
54 |
return 'output/output.wav'
|
55 |
|
56 |
|
|
|
|
|
57 |
inputs = [gr.inputs.Textbox(lines=5, label="Input Text"),
|
58 |
-
gr.inputs.Dropdown(
|
59 |
-
|
60 |
]
|
61 |
outputs = gr.outputs.Audio(type="filepath", label="Output Audio")
|
62 |
title = "Text To Speech"
|
|
|
9 |
# print(model)
|
10 |
|
11 |
# print("Using model: ", all_models[0])
|
12 |
+
model = all_models[0]
|
13 |
# Init TTS
|
14 |
|
15 |
|
|
|
17 |
|
18 |
voiceCloneModel = TTS('tts_models/multilingual/multi-dataset/your_tts')
|
19 |
|
20 |
+
# tts = TTS("tts_models/de/thorsten/tacotron2-DDC")
|
21 |
+
|
22 |
|
23 |
def run_cmd(command):
|
24 |
try:
|
|
|
38 |
speaker = 'input/obama.mp3'
|
39 |
elif (speaker == 'Speaker-4'):
|
40 |
speaker = 'input/trump.wav'
|
41 |
+
elif (speaker == 'Rock'):
|
42 |
+
speaker = 'input/sample/Dwayne-Johnson-sample.wav'
|
43 |
+
elif (speaker == 'Elon'):
|
44 |
+
speaker = 'input/sample/Elon-Sample.wav'
|
45 |
+
elif (speaker == 'Obama'):
|
46 |
+
speaker = 'input/sample/Obama-sample.wav'
|
47 |
else:
|
48 |
speaker = 'input/z-default.wav'
|
49 |
# print("speaker: ", speaker)
|
50 |
# cmd = ['tts', '--text', text, '--out_path', 'output/tts_output.wav']
|
51 |
# run_cmd(cmd)
|
52 |
# Text to speech to a file
|
53 |
+
# tts = TTS(model="tts_models/multilingual/multi-dataset/your_tts",
|
54 |
# progress_bar=False, gpu=True)
|
55 |
voiceCloneModel.tts_to_file(text, speaker_wav=speaker,
|
56 |
language="en", file_path="output/output.wav")
|
57 |
|
58 |
+
# for i in range(len(model.languages)):
|
59 |
+
# model.tts_to_file(text=text,
|
60 |
+
# speaker=model.speakers[i], language=model.languages[0], file_path='output/output-'+str(i)+'.wav')
|
61 |
|
62 |
return 'output/output.wav'
|
63 |
|
64 |
|
65 |
+
sampleInput = ['Speaker-1', 'Speaker-2', 'Speaker-3',
|
66 |
+
'Speaker-4', 'Rock', 'Elon', 'Obama']
|
67 |
inputs = [gr.inputs.Textbox(lines=5, label="Input Text"),
|
68 |
+
gr.inputs.Dropdown(
|
69 |
+
sampleInput, label="Sample Input", default="Speaker-1",)
|
70 |
]
|
71 |
outputs = gr.outputs.Audio(type="filepath", label="Output Audio")
|
72 |
title = "Text To Speech"
|
input/sample/Dwayne-Johnson-sample.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3c3d9d61a817cc459f890867c584a0496245c81b747205b48c18b49b6723d8b
|
3 |
+
size 1578042
|
input/sample/Elon-Sample.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6609e4b4c5a8ce77eff174fd2eca989ded8a28fd2ca5b1866035fd54247649b
|
3 |
+
size 1233978
|
input/sample/Obama-sample.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6dec4bb97019439e01a8909d68f5704e0e2c6de12c57865f3d4a01132519c045
|
3 |
+
size 930874
|
output/output.wav
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07abadaef514caf57a002e76da940e5900a6851ccba39076c3e7eb4359fdf82d
|
3 |
+
size 1364620
|