Vaibhav Srivastav committed on
Commit
2ed8747
·
1 Parent(s): f8a39ef
Files changed (1) hide show
  1. app.py +20 -10
app.py CHANGED
@@ -31,6 +31,20 @@ SAMPLE_RATE = 24_000
31
 
32
  vocos = Vocos.from_pretrained("charactr/vocos-encodec-24khz").to(device)
33
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
34
  # import model
35
  if device == "cpu":
36
  bark = BarkModel.from_pretrained(HUB_PATH)
@@ -65,23 +79,19 @@ def generate_audio(text, voice_preset = None, lag = 0):
65
 
66
  # Gradio blocks demo
67
  with gr.Blocks() as demo_blocks:
68
- gr.Markdown("""<h1 align="center">🐶 Bark with Vocos</h1>""")
69
- gr.HTML("""<h3 style="text-align:center;">📢 Vocos-enhanced TTS 🦾! </h3>""")
70
- with gr.Group():
71
- with gr.Row():
72
- inp_text = gr.Textbox(label="What should Bark say?", info="Enter text here")
73
- with gr.Row():
74
- spk = gr.Dropdown(
75
  speaker_embeddings,
76
  value=None,
77
  label="Available voice presets",
78
  info="Default: No speaker embeddings"
79
  )
80
-
81
- with gr.Row():
82
  btn = gr.Button("Synthesise speech!")
83
 
84
- with gr.Row():
85
  out_audio_vocos = gr.Audio(type="numpy", autoplay=False, label="Vocos enhanced speech", show_label=True)
86
 
87
  btn.click(generate_audio, [inp_text, spk], [out_audio_vocos])
 
31
 
32
  vocos = Vocos.from_pretrained("charactr/vocos-encodec-24khz").to(device)
33
 
34
+ title = "# 🐶 Bark with Charactr.ai's <a href='https://github.com/charactr-platform/vocos'>Vocos</a>"
35
+
36
+ description = """
37
+ <div>
38
+ <a style="display:inline-block" href='https://github.com/charactr-platform/vocos'><img src='https://img.shields.io/github/stars/charactr-platform/vocos?style=social' /></a>
39
+ <a style="display:inline-block; margin-left: 1em" href="https://huggingface.co/spaces/hf-audio/vocos-bark?duplicate=true"><img src="https://img.shields.io/badge/-Duplicate%20Space%20to%20skip%20the%20queue-blue?labelColor=white&style=flat&logo=data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAABAAAAAQCAYAAAAf8/9hAAAAAXNSR0IArs4c6QAAAP5JREFUOE+lk7FqAkEURY+ltunEgFXS2sZGIbXfEPdLlnxJyDdYB62sbbUKpLbVNhyYFzbrrA74YJlh9r079973psed0cvUD4A+4HoCjsA85X0Dfn/RBLBgBDxnQPfAEJgBY+A9gALA4tcbamSzS4xq4FOQAJgCDwV2CPKV8tZAJcAjMMkUe1vX+U+SMhfAJEHasQIWmXNN3abzDwHUrgcRGmYcgKe0bxrblHEB4E/pndMazNpSZGcsZdBlYJcEL9Afo75molJyM2FxmPgmgPqlWNLGfwZGG6UiyEvLzHYDmoPkDDiNm9JR9uboiONcBXrpY1qmgs21x1QwyZcpvxt9NS09PlsPAAAAAElFTkSuQmCC&logoWidth=14" alt="Duplicate Space"></a>
40
+ </div>
41
+ Bark is a universal text-to-audio model created by [Suno](https://www.suno.ai), with code publicly available [here](https://github.com/suno-ai/bark). \
42
+ Bark can generate highly realistic, multilingual speech as well as other audio - including music, background noise and simple sound effects. \
43
+ In this demo, we leverage charactr.ai's Vocos model to create high quality audio from bark. \
44
+ The model output is not censored and the authors do not endorse the opinions in the generated content. \
45
+ Use at your own risk.
46
+ """
47
+
48
  # import model
49
  if device == "cpu":
50
  bark = BarkModel.from_pretrained(HUB_PATH)
 
79
 
80
  # Gradio blocks demo
81
  with gr.Blocks() as demo_blocks:
82
+ gr.Markdown(title)
83
+ gr.Markdown(description)
84
+ with gr.Column():
85
+ inp_text = gr.Textbox(label="What should Bark say?", info="Enter text here")
86
+ spk = gr.Dropdown(
 
 
87
  speaker_embeddings,
88
  value=None,
89
  label="Available voice presets",
90
  info="Default: No speaker embeddings"
91
  )
 
 
92
  btn = gr.Button("Synthesise speech!")
93
 
94
+ with gr.Column():
95
  out_audio_vocos = gr.Audio(type="numpy", autoplay=False, label="Vocos enhanced speech", show_label=True)
96
 
97
  btn.click(generate_audio, [inp_text, spk], [out_audio_vocos])