Spaces:
Runtime error
Runtime error
Vaibhav Srivastav
committed on
Commit
·
2ed8747
1
Parent(s):
f8a39ef
up
Browse files
app.py
CHANGED
@@ -31,6 +31,20 @@ SAMPLE_RATE = 24_000
|
|
31 |
|
32 |
vocos = Vocos.from_pretrained("charactr/vocos-encodec-24khz").to(device)
|
33 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
34 |
# import model
|
35 |
if device == "cpu":
|
36 |
bark = BarkModel.from_pretrained(HUB_PATH)
|
@@ -65,23 +79,19 @@ def generate_audio(text, voice_preset = None, lag = 0):
|
|
65 |
|
66 |
# Gradio blocks demo
|
67 |
with gr.Blocks() as demo_blocks:
|
68 |
-
gr.Markdown(
|
69 |
-
gr.
|
70 |
-
with gr.
|
71 |
-
|
72 |
-
|
73 |
-
with gr.Row():
|
74 |
-
spk = gr.Dropdown(
|
75 |
speaker_embeddings,
|
76 |
value=None,
|
77 |
label="Available voice presets",
|
78 |
info="Default: No speaker embeddings"
|
79 |
)
|
80 |
-
|
81 |
-
with gr.Row():
|
82 |
btn = gr.Button("Synthesise speech!")
|
83 |
|
84 |
-
with gr.
|
85 |
out_audio_vocos = gr.Audio(type="numpy", autoplay=False, label="Vocos enhanced speech", show_label=True)
|
86 |
|
87 |
btn.click(generate_audio, [inp_text, spk], [out_audio_vocos])
|
|
|
31 |
|
32 |
vocos = Vocos.from_pretrained("charactr/vocos-encodec-24khz").to(device)
|
33 |
|
34 |
+
# Markdown heading for the demo page; passed to gr.Markdown(title) in the Blocks layout.
title = "# 🐶 Bark with Charactr.ai's <a href='https://github.com/charactr-platform/vocos'>Vocos</a>"
|
35 |
+
|
36 |
+
description = """
|
37 |
+
<div>
|
38 |
+
<a style="display:inline-block" href='https://github.com/charactr-platform/vocos'><img src='https://img.shields.io/github/stars/charactr-platform/vocos?style=social' /></a>
|
39 |
+
<a style="display:inline-block; margin-left: 1em" href="https://huggingface.co/spaces/hf-audio/vocos-bark?duplicate=true"><img src="https://img.shields.io/badge/-Duplicate%20Space%20to%20skip%20the%20queue-blue?labelColor=white&style=flat&logo=data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAABAAAAAQCAYAAAAf8/9hAAAAAXNSR0IArs4c6QAAAP5JREFUOE+lk7FqAkEURY+ltunEgFXS2sZGIbXfEPdLlnxJyDdYB62sbbUKpLbVNhyYFzbrrA74YJlh9r079973psed0cvUD4A+4HoCjsA85X0Dfn/RBLBgBDxnQPfAEJgBY+A9gALA4tcbamSzS4xq4FOQAJgCDwV2CPKV8tZAJcAjMMkUe1vX+U+SMhfAJEHasQIWmXNN3abzDwHUrgcRGmYcgKe0bxrblHEB4E/pndMazNpSZGcsZdBlYJcEL9Afo75molJyM2FxmPgmgPqlWNLGfwZGG6UiyEvLzHYDmoPkDDiNm9JR9uboiONcBXrpY1qmgs21x1QwyZcpvxt9NS09PlsPAAAAAElFTkSuQmCC&logoWidth=14" alt="Duplicate Space"></a>
|
40 |
+
</div>
|
41 |
+
Bark is a universal text-to-audio model created by [Suno](https://www.suno.ai), with code publicly available [here](https://github.com/suno-ai/bark). \
|
42 |
+
Bark can generate highly realistic, multilingual speech as well as other audio - including music, background noise and simple sound effects. \
|
43 |
+
In this demo, we leverage charactr.ai's Vocos model to create high quality audio from bark. \
|
44 |
+
The model output is not censored and the authors do not endorse the opinions in the generated content. \
|
45 |
+
Use at your own risk.
|
46 |
+
"""
|
47 |
+
|
48 |
# import model
|
49 |
if device == "cpu":
|
50 |
bark = BarkModel.from_pretrained(HUB_PATH)
|
|
|
79 |
|
80 |
# Gradio blocks demo
|
81 |
with gr.Blocks() as demo_blocks:
|
82 |
+
gr.Markdown(title)
|
83 |
+
gr.Markdown(description)
|
84 |
+
with gr.column():
|
85 |
+
inp_text = gr.Textbox(label="What should Bark say?", info="Enter text here")
|
86 |
+
spk = gr.Dropdown(
|
|
|
|
|
87 |
speaker_embeddings,
|
88 |
value=None,
|
89 |
label="Available voice presets",
|
90 |
info="Default: No speaker embeddings"
|
91 |
)
|
|
|
|
|
92 |
btn = gr.Button("Synthesise speech!")
|
93 |
|
94 |
+
with gr.column():
|
95 |
out_audio_vocos = gr.Audio(type="numpy", autoplay=False, label="Vocos enhanced speech", show_label=True)
|
96 |
|
97 |
btn.click(generate_audio, [inp_text, spk], [out_audio_vocos])
|