Spaces:

tobiccino
/

tts

Sleeping

File size: 4,990 Bytes

from vietTTS.hifigan.mel2wave import mel2wave
from vietTTS.nat.text2mel import text2mel
from vietTTS.synthesizer import nat_normalize_text
import numpy as np
import gradio as gr
import os


def text_to_speech(text,stop_duration):
    print("starting")
    # prevent too long text
    if len(text) > 500:
        text = text[:500]
    # stop_duration_float = float(stop_duration_text)
    text = clean_text(text)
    text = nat_normalize_text(text)
    mel = text2mel(
        text,
        "lexicon.txt",
        stop_duration,
        "acoustic_latest_ckpt.pickle",
        "duration_latest_ckpt.pickle",
    )
    wave = mel2wave(mel, "config.json", "hk_hifi.pickle")
    return (wave * (2**15)).astype(np.int16)


def speak(text,stop_duration):
    y = text_to_speech(text,stop_duration)
    return 16_000, y



def clean_text(test_string):
  list_word = test_string.split()
  # print(list_word)

  regex = r"\d{2}(?P<sep>[-/])\d{1,2}(?P=sep)\d{4}"

  for word in list_word :
    try:
      # print(word)
      searchbox_result = re.match(regex, word)
      day = searchbox_result.group(0)
      day2 = day
      day2 = day2.replace('/',' ').replace('-',' ')
      list_date = day2.split(' ')
      date_result = 'Ngày ' + n2w(list_date[0]) + ' tháng ' + n2w(list_date[1].replace('0','') if list_date[1].startswith('0') else list_date[1]) + ' năm ' + n2w(list_date[2])
      # print(date_result)
      test_string = test_string.replace(word, date_result)

    except AttributeError:
      # print(word) 
      # print("can't make a group")
      continue


  # print(test_string)

  regex2 = r"\d{2}(?P<sep>[-/])\d{1,2}"

  for word in list_word :
    try:
      # print(word)
      searchbox_result = re.match(regex2, word)
      day = searchbox_result.group(0)
      day2 = day
      day2 = day2.replace('/',' ').replace('-',' ')
      list_date = day2.split(' ')
      date_result = 'Ngày ' + n2w(list_date[0]) + ' tháng ' + n2w(list_date[1].replace('0','') if list_date[1].startswith('0') else list_date[1])
      # print(date_result)
      test_string = test_string.replace(word, date_result)

    except AttributeError:
      # print(word) 
      # print("can't make a group")
      continue


  # print(test_string)

  regex3 = r"\d{1,2}(?P<sep>[h:])\d{1,2}"

  for word in list_word :
    try:
      # print(word)
      searchbox_result = re.match(regex3, word)
      day = searchbox_result.group(0)
      day2 = day
      day2 = day2.replace('h',' ').replace(':',' ')
      list_date = day2.split(' ')
      date_result = n2w(list_date[0]) + ' giờ ' + n2w(list_date[1].replace('0','') if list_date[1].startswith('0') else list_date[1]) + ' phút '
      # print(date_result)
      test_string = test_string.replace(word, date_result)

    except AttributeError:
      # print(word) 
      # print("can't make a group")
      continue


  print(test_string)

  for word in list_word :
    try:
      if word.isdigit() :
        # print(word)
        text_result = n2w_single(word)
        # print(text_result)
        test_string = test_string.replace(word, text_result, 1)

    except AttributeError:
      # print(word) 
      print("can't make a group")
      continue


  return test_string


title = "SLT TTS"
description = "SLT Vietnamese Text to speech demo."

gr.Interface(
    fn=speak, 
    inputs=["text","number"],
    outputs="audio",
    title = title,
    examples = [
    ["Thành phố muốn thí điểm thu thuế bất động sản thứ 2, tự quyết nhiều quyết định đầu tư để thu hút nguồn vốn tư nhân",0.2],
    ["Thứ năm, 22/12/2022, 10:59 những mét hàng rào đầu tiên quanh công viên lớn nhất thủ đô được tháo dỡ, chuyển công viên sang hình thức mở, không thu vé.",0.2],
    ["Cô dì chú bác nhà em không học hành vì vẫn làm bất động sản. Có phải làm ngành này thì chỉ cần biết sơ sơ, không cần học hành?... Đó là vấn đề được học sinh trường Trung học phổ thông  Gia Định, Thành phố Hồ Chí Minh đặt ra tại buổi khai mạc chương trình tư vấn tuyển sinh do Tạp chí Giáo dục Thành phố Hồ Chí Minh tổ chức sáng mồng 9 tháng 1.",0.2],
    ["Trong chuyến công du nước ngoài thứ hai từ khi Nga phát động chiến dịch quân sự tại Ukraine gần 12 tháng trước, Tổng thống Volodymyr Zelensky dự kiến phát biểu tại Nghị viện châu Âu ngày 9/2",0.2],
    ["Tuy nhiên, kế hoạch này đang đứng trước nguy cơ đổ vỡ sau khi các quan chức Nghị viện châu âu làm rò rỉ kế hoạch bí mật tiếp đón Tổng thống Ukraine. Hồi đầu tuần, thông tin về chuyến thăm xuất hiện trên nhiều tờ báo châu âu, khởi nguồn từ báo La Stampa của Italy.",0.2]
    ],
    description=description,
    theme="default",
    allow_screenshot=False,
    allow_flagging="never",
).launch(debug=False)