thealphamerc committed on
Commit
ebe9cbe
·
1 Parent(s): 7d0bff2

Add some more sample voices

Browse files
.vscode/settings.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "cSpell.words": ["Elon"]
3
+ }
app.py CHANGED
@@ -9,7 +9,7 @@ all_models = TTS.list_models()
9
  # print(model)
10
 
11
  # print("Using model: ", all_models[0])
12
- model_name = all_models[0]
13
  # Init TTS
14
 
15
 
@@ -17,6 +17,8 @@ print("Downloading model...", '')
17
 
18
  voiceCloneModel = TTS('tts_models/multilingual/multi-dataset/your_tts')
19
 
 
 
20
 
21
  def run_cmd(command):
22
  try:
@@ -36,27 +38,35 @@ def inference(text, speaker):
36
  speaker = 'input/obama.mp3'
37
  elif (speaker == 'Speaker-4'):
38
  speaker = 'input/trump.wav'
 
 
 
 
 
 
39
  else:
40
  speaker = 'input/z-default.wav'
41
  # print("speaker: ", speaker)
42
  # cmd = ['tts', '--text', text, '--out_path', 'output/tts_output.wav']
43
  # run_cmd(cmd)
44
  # Text to speech to a file
45
- # tts = TTS(model_name="tts_models/multilingual/multi-dataset/your_tts",
46
  # progress_bar=False, gpu=True)
47
  voiceCloneModel.tts_to_file(text, speaker_wav=speaker,
48
  language="en", file_path="output/output.wav")
49
 
50
- # for i in range(len(tts.languages)):
51
- # tts.tts_to_file(text=text,
52
- # speaker=tts.speakers[i], language=tts.languages[0], file_path='output/output-'+str(i)+'.wav')
53
 
54
  return 'output/output.wav'
55
 
56
 
 
 
57
  inputs = [gr.inputs.Textbox(lines=5, label="Input Text"),
58
- gr.inputs.Dropdown(['Speaker-1', 'Speaker-2', 'Speaker-3',
59
- 'Speaker-4'], label="Model")
60
  ]
61
  outputs = gr.outputs.Audio(type="filepath", label="Output Audio")
62
  title = "Text To Speech"
 
9
  # print(model)
10
 
11
  # print("Using model: ", all_models[0])
12
+ model = all_models[0]
13
  # Init TTS
14
 
15
 
 
17
 
18
  voiceCloneModel = TTS('tts_models/multilingual/multi-dataset/your_tts')
19
 
20
+ # tts = TTS("tts_models/de/thorsten/tacotron2-DDC")
21
+
22
 
23
  def run_cmd(command):
24
  try:
 
38
  speaker = 'input/obama.mp3'
39
  elif (speaker == 'Speaker-4'):
40
  speaker = 'input/trump.wav'
41
+ elif (speaker == 'Rock'):
42
+ speaker = 'input/sample/Dwayne-Johnson-sample.wav'
43
+ elif (speaker == 'Elon'):
44
+ speaker = 'input/sample/Elon-Sample.wav'
45
+ elif (speaker == 'Obama'):
46
+ speaker = 'input/sample/Obama-sample.wav'
47
  else:
48
  speaker = 'input/z-default.wav'
49
  # print("speaker: ", speaker)
50
  # cmd = ['tts', '--text', text, '--out_path', 'output/tts_output.wav']
51
  # run_cmd(cmd)
52
  # Text to speech to a file
53
+ # tts = TTS(model="tts_models/multilingual/multi-dataset/your_tts",
54
  # progress_bar=False, gpu=True)
55
  voiceCloneModel.tts_to_file(text, speaker_wav=speaker,
56
  language="en", file_path="output/output.wav")
57
 
58
+ # for i in range(len(model.languages)):
59
+ # model.tts_to_file(text=text,
60
+ # speaker=model.speakers[i], language=model.languages[0], file_path='output/output-'+str(i)+'.wav')
61
 
62
  return 'output/output.wav'
63
 
64
 
65
+ sampleInput = ['Speaker-1', 'Speaker-2', 'Speaker-3',
66
+ 'Speaker-4', 'Rock', 'Elon', 'Obama']
67
  inputs = [gr.inputs.Textbox(lines=5, label="Input Text"),
68
+ gr.inputs.Dropdown(
69
+ sampleInput, label="Sample Input", default="Speaker-1",)
70
  ]
71
  outputs = gr.outputs.Audio(type="filepath", label="Output Audio")
72
  title = "Text To Speech"
input/sample/Dwayne-Johnson-sample.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3c3d9d61a817cc459f890867c584a0496245c81b747205b48c18b49b6723d8b
3
+ size 1578042
input/sample/Elon-Sample.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6609e4b4c5a8ce77eff174fd2eca989ded8a28fd2ca5b1866035fd54247649b
3
+ size 1233978
input/sample/Obama-sample.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6dec4bb97019439e01a8909d68f5704e0e2c6de12c57865f3d4a01132519c045
3
+ size 930874
output/output.wav CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ddd247a0b637133326079fa149c85c8544671c92c0c7a78ec93952db3cc0dfb2
3
- size 132172
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07abadaef514caf57a002e76da940e5900a6851ccba39076c3e7eb4359fdf82d
3
+ size 1364620