TTS-toolbox

Runtime error

App Files Files Community

clementruhm committed on Oct 4, 2022

Commit

53f8a32

•

1 Parent(s): 88ef979

Initial commit

Browse files

Files changed (5) hide show

.gitignore +1 -0
README.md +5 -5
app.py +101 -0
requirements.txt +5 -0
setup.cfg +12 -0

.gitignore ADDED Viewed

	@@ -0,0 +1 @@


1	+ .idea

README.md CHANGED Viewed

@@ -1,12 +1,12 @@
 ---
-title: Tts
-emoji: 📉
-colorFrom: pink
-colorTo: blue
 sdk: gradio
 sdk_version: 3.4
 app_file: app.py
 pinned: false
 ---
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

 ---
+title: Text-to-Speech
+emoji: 💬
+colorFrom: blue
+colorTo: yellow
 sdk: gradio
 sdk_version: 3.4
 app_file: app.py
 pinned: false
 ---
+Text-to-Speech interactive demo, using [balacoon_tts](https://balacoon.com).

app.py ADDED Viewed

	@@ -0,0 +1,101 @@

+"""
+Copyright 2022 Balacoon
+TTS interactive demo
+"""
+import logging
+from typing import cast
+import gradio as gr
+from balacoon_tts import TTS
+from huggingface_hub import hf_hub_download, list_repo_files
+# Global TTS engine shared by the UI callbacks defined in `main`.
+# It stays `None` until a model is picked in the "Model" dropdown;
+# the `set_model` callback then replaces it with a `TTS` instance
+# created from the downloaded model file.
+tts = None
+def main():
+    logging.basicConfig(level=logging.INFO)
+    with gr.Blocks() as demo:
+        gr.Markdown(
+            """
+            <h1 align="center">Balacoon🦝 Text-to-Speech</h1>
+            1. Write an utterance to generate,
+            2. Select the model to synthesize with
+            3. Select speaker (only for multi-speaker models)
+            4. Hit "Generate" and listen to the result!
+            When you select model for the first time,
+            it will take around 30 seconds to download it.
+            You can learn more about models available
+            [here](https://huggingface.co/balacoon/tts),
+            visit [Balacoon website](https://balacoon.com/) for more info.
+            """
+        )
+        with gr.Row():
+            text = gr.Textbox(label="Text", placeholder="Type something here...")
+        with gr.Row():
+            with gr.Column():
+                repo_files = list_repo_files(repo_id="balacoon/tts")
+                model_files = [x for x in repo_files if x.endswith(".addon")]
+                model_name = gr.Dropdown(
+                    label="Model",
+                    choices=model_files,
+                )
+            with gr.Column():
+                speaker = gr.Dropdown(label="Speaker", choices=[])
+            def set_model(model_name_str: str):
+                """
+                gets value from `model_name`, loads model,
+                re-initializes tts object, gets list of
+                speakers that model supports and set them to `speaker`
+                """
+                model_path = hf_hub_download(
+                    repo_id="balacoon/tts", filename=model_name_str
+                )
+                global tts
+                tts = TTS(model_path)
+                speakers = tts.get_speakers()
+                if speakers:
+                    visible = True
+                    value = speakers[-1]
+                else:
+                    visible = False
+                    value = ""
+                return gr.Dropdown.update(
+                    choices=speakers, value=value, visible=visible
+                )
+            model_name.change(set_model, inputs=model_name, outputs=speaker)
+        with gr.Row():
+            generate = gr.Button("Generate")
+        with gr.Row():
+            audio = gr.Audio()
+        def synthesize_audio(text_str: str, speaker_str: str = ""):
+            """
+            gets utterance to synthesize from `text` Textbox
+            and speaker name from `speaker` dropdown list.
+            speaker name might be empty for single-speaker models.
+            Synthesizes the waveform and updates `audio` with it.
+            """
+            if not text_str:
+                logging.info("text or speaker are not provided")
+                return None
+            global tts
+            samples = cast(TTS, tts).synthesize(text_str, speaker_str)
+            return gr.Audio.update(value=(24000, samples))
+        generate.click(synthesize_audio, inputs=[text, speaker], outputs=audio)
+    demo.launch()
+# build and launch the demo only when executed as a script, not on import
+if __name__ == "__main__":
+    main()

requirements.txt ADDED Viewed

	@@ -0,0 +1,5 @@

+--index-url https://pypi.fury.io/balacoon/
+--extra-index-url https://pypi.org/simple/
+balacoon-tts==0.0.1
+huggingface_hub
+numpy

setup.cfg ADDED Viewed

	@@ -0,0 +1,12 @@

+[flake8]
+max_complexity=10
+per-file-ignores=__init__.py:F401,F403
+ignore = E203,W503
+max-line-length=119
+[isort]
+profile=black
+line_length=119
+[mypy]
+ignore_missing_imports = True