Ailyth commited on
Commit
c283d94
·
verified ·
1 Parent(s): 2eccd3d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +26 -15
app.py CHANGED
@@ -432,7 +432,11 @@ def get_tts_wav(ref_wav_path, prompt_text, prompt_language, text, text_language,
432
  if (text[-1] not in splits): text += "。" if text_language != "en" else "."
433
  print(("\n🎈实际输入的目标文本(每句):"), text)
434
  phones2, word2ph2, norm_text2 = get_cleaned_text_final(text, text_language)
435
- bert2 = get_bert_final(phones2, word2ph2, norm_text2, text_language, device).to(dtype)
 
 
 
 
436
  bert = torch.cat([bert1, bert2], 1)
437
 
438
  all_phoneme_ids = torch.LongTensor(phones1 + phones2).to(device).unsqueeze(0)
@@ -686,7 +690,7 @@ def clone_voice(user_voice,user_text,user_lang):
686
  if user_text == '':
687
  wprint("Please enter text to generate/请输入生成文字")
688
  return None
689
- #tprint('⚡Start clone')
690
  user_text=trim_text(user_text,user_lang)
691
  time1=timer()
692
  global gpt_path, sovits_path
@@ -724,18 +728,22 @@ with gr.Blocks(theme='Kasien/ali_theme_custom') as app:
724
  gr.HTML('''
725
  <h1 style="font-size: 25px;">A TTS GENERATOR</h1>
726
  <p style="margin-bottom: 10px; font-size: 100%">
727
- If you like this space, please click the ❤️ at the top of the page..如喜欢,请点一下页面顶部的❤️<br>
728
- 💡This space is based on the innovative text-to-speech generation solution
729
- <a href="https://github.com/RVC-Boss/GPT-SoVITS" target="_blank">GPT-SoVITS</a> .
 
730
  You can visit the repo's github homepage to learn training and inference.<br>
731
- 本空间基于新式的文字转语音生成方案 <a href="https://github.com/RVC-Boss/GPT-SoVITS" target="_blank">GPT-SoVITS</a> .
732
- 你可以前往项目的github主页学习如何推理和训练。<br>
733
- ✏️Generating voice is very slow due to using HuggingFace's free CPU in this space. For faster generation,
734
- click the Colab icon below to use this space in Colab, which will significantly improve the speed.<br>
735
- 由于本空间使用huggingface的免费CPU进行推理,因此速度很慢,如想快速生成,
736
- 请点击下方的Colab图标,前往Colab使用已获得更快的生成速度。
737
- </p>
738
- <a href="https://colab.research.google.com/drive/1fTuPZ4tZsAjS-TrhQWMCb7KRdnU8aF6j#scrollTo=MDtJIbLdLHe9" target="_blank"><img src="https://camo.githubusercontent.com/dd83d4a334eab7ada034c13747d9e2237182826d32e3fda6629740b6e02f18d8/68747470733a2f2f696d672e736869656c64732e696f2f62616467652f436f6c61622d4639414230303f7374796c653d666f722d7468652d6261646765266c6f676f3d676f6f676c65636f6c616226636f6c6f723d353235323532" alt="colab"></a>
 
 
 
739
  ''')
740
 
741
  default_voice_wav, default_voice_wav_words, default_language, _, default_model_name, _, default_tone_sample_path = update_model("Trump")
@@ -749,7 +757,9 @@ with gr.Blocks(theme='Kasien/ali_theme_custom') as app:
749
 
750
  plsh='Text must match the selected language option to prevent errors, for example, if English is input but Chinese is selected for generation.\n文字一定要和语言选项匹配,不然要报错,比如输入的是英文,生成语言选中文'
751
  limit='Max 70 words. Excess will be ignored./单次最多处理120字左���,多余的会被忽略'
752
-
 
 
753
  with gr.Row():
754
  model_name = gr.Textbox(label="Seleted Model/已选模型", value=default_model_name, scale=1)
755
  text = gr.Textbox(label="Input some text for voice generation/输入想要生成语音的文字", lines=5,scale=8,
@@ -794,7 +804,8 @@ with gr.Blocks(theme='Kasien/ali_theme_custom') as app:
794
  volume = gr.Slider(minimum=0.5, maximum=2, value=1, step=0.01, label='Volume/音量')
795
 
796
 
797
-
 
798
  with gr.Row():
799
  main_button = gr.Button("✨Generate Voice", variant="primary", scale=1)
800
  output = gr.Audio(label="💾Download it by clicking ⬇️", scale=3)
 
432
  if (text[-1] not in splits): text += "。" if text_language != "en" else "."
433
  print(("\n🎈实际输入的目标文本(每句):"), text)
434
  phones2, word2ph2, norm_text2 = get_cleaned_text_final(text, text_language)
435
+ try:
436
+ bert2 = get_bert_final(phones2, word2ph2, norm_text2, text_language, device).to(dtype)
437
+ except RuntimeError as e:
438
+ wprint(f"The input text does not match the language/输入文本与语言不匹配: {e}")
439
+ return None
440
  bert = torch.cat([bert1, bert2], 1)
441
 
442
  all_phoneme_ids = torch.LongTensor(phones1 + phones2).to(device).unsqueeze(0)
 
690
  if user_text == '':
691
  wprint("Please enter text to generate/请输入生成文字")
692
  return None
693
+ tprint('⚡Start clone')
694
  user_text=trim_text(user_text,user_lang)
695
  time1=timer()
696
  global gpt_path, sovits_path
 
728
  gr.HTML('''
729
  <h1 style="font-size: 25px;">A TTS GENERATOR</h1>
730
  <p style="margin-bottom: 10px; font-size: 100%">
731
+ If you like this space, please click the ❤️ at the top of the page..如喜欢,请点一下页面顶部的❤️<br>
732
+ </p>''')
733
+
734
+ gr.Markdown("""* This space is based on the text-to-speech generation solution GPT-SoVITS .
735
  You can visit the repo's github homepage to learn training and inference.<br>
736
+ 本空间基于文字转语音生成方案 GPT-SoVITS . 你可以前往项目的github主页学习如何推理和训练。
737
+ * ⚠️Generating voice is very slow due to using HuggingFace's free CPU in this space.
738
+ For faster generation, click the Colab icon below to use this space in Colab,
739
+ which will significantly improve the speed.<br>
740
+ 由于本空间使用huggingface的免费CPU进行推理,因此速度很慢,如想快速生成,请点击下方的Colab图标,
741
+ 前往Colab使用已获得更快的生成速度。
742
+ <br>Colabの使用を強くお勧めします。より速い生成速度が得られます。
743
+ * The model's corresponding language is its native language, but in fact,
744
+ each model can speak three languages.<br>模型对应的语言是其母语,但实际上,
745
+ 每个模型都能说三种语言<br>モデルに対応する言語はその母国語ですが、実際には、各モデルは3つの言語を話すことができます。""")
746
+ gr.HTML('''<a href="https://colab.research.google.com/drive/1fTuPZ4tZsAjS-TrhQWMCb7KRdnU8aF6j#scrollTo=MDtJIbLdLHe9" target="_blank"><img src="https://camo.githubusercontent.com/dd83d4a334eab7ada034c13747d9e2237182826d32e3fda6629740b6e02f18d8/68747470733a2f2f696d672e736869656c64732e696f2f62616467652f436f6c61622d4639414230303f7374796c653d666f722d7468652d6261646765266c6f676f3d676f6f676c65636f6c616226636f6c6f723d353235323532" alt="colab"></a>
747
  ''')
748
 
749
  default_voice_wav, default_voice_wav_words, default_language, _, default_model_name, _, default_tone_sample_path = update_model("Trump")
 
757
 
758
  plsh='Text must match the selected language option to prevent errors, for example, if English is input but Chinese is selected for generation.\n文字一定要和语言选项匹配,不然要报错,比如输入的是英文,生成语言选中文'
759
  limit='Max 70 words. Excess will be ignored./单次最多处理120字左���,多余的会被忽略'
760
+
761
+ gr.HTML('''
762
+ <b>输入文字</b>''')
763
  with gr.Row():
764
  model_name = gr.Textbox(label="Seleted Model/已选模型", value=default_model_name, scale=1)
765
  text = gr.Textbox(label="Input some text for voice generation/输入想要生成语音的文字", lines=5,scale=8,
 
804
  volume = gr.Slider(minimum=0.5, maximum=2, value=1, step=0.01, label='Volume/音量')
805
 
806
 
807
+ gr.HTML('''
808
+ <b>开始生成</b>''')
809
  with gr.Row():
810
  main_button = gr.Button("✨Generate Voice", variant="primary", scale=1)
811
  output = gr.Audio(label="💾Download it by clicking ⬇️", scale=3)