Spaces:

gianTheo
/

Greek-Transcription

Sleeping

App Files Files Community

gianTheo commited on Nov 28, 2023

Commit

7e7af56

1 Parent(s): 4e08dc5

Update app.py

Browse files

Files changed (1) hide show

app.py +49 -7

app.py CHANGED Viewed

@@ -1,18 +1,60 @@
 from transformers import pipeline
 import gradio as gr
-pipe = pipeline(model="farsipal/whisper-small-el")  # change to "your-username/the-name-you-picked"
 def transcribe(audio):
     text = pipe(audio)["text"]
     return text
-iface = gr.Interface(
-    fn=transcribe,
-    inputs=gr.Audio(sources="microphone", type="filepath"),
     outputs="text",
-    title="Whisper Greek Transcription",
-    description="Realtime demo for Greek speech recognition using a fine-tuned Whisper model.",
 )
-iface.launch()

 from transformers import pipeline
 import gradio as gr
+import torch
+import pytube as pt
+checkpoint = "farsipal/whisper-small-el"
+device = 0 if torch.cuda.is_available() else "cpu"
+print(device)
+pipe = pipeline(task = "automatic-speech-recognition", model = checkpoint,chunk_length_s=30,device = device)
 def transcribe(audio):
     text = pipe(audio)["text"]
     return text
+def transcribe_url(yt_url):
+  yt = pt.YouTube(yt_url)
+  stream = yt.streams.filter(only_audio=True)[0]
+  stream.download(filename = "audio.mp3")
+  text = pipe("audio.mp3")["text"]
+  return text
+demo = gr.Blocks()
+microphone_interface = gr.Interface(
+    fn=transcribe,
+    inputs = gr.Audio(sources="microphone", type="filepath"),
     outputs="text",
+    title="Whisper Small Greek Finetuned raw microphone audio",
+    description="Realtime demo for Greek speech recognition using a fine-tuned Whisper small model."
 )
+file_interface = gr.Interface(
+    fn=transcribe,
+    inputs = gr.Audio(sources="upload", type="filepath"),
+    outputs="text",
+    title="Whisper Small Greek Finetuned for audio file.",
+    description="Realtime demo for Greek speech recognition using a fine-tuned Whisper small model."
+)
+url_interface = gr.Interface(
+    fn = transcribe_url,
+    inputs = gr.Textbox(lines=1, placeholder="Paste the URL to a YouTube video here", label="YouTube URL"),
+    outputs = "text",
+    title = "Whisper Small Greek Finetuned for URL transcription",
+    description = "Realtime demo for Greek speech recognition using a fine-tuned Whisper small model."
+)
+with demo:
+    gr.TabbedInterface([microphone_interface,file_interface, url_interface], ["Transcribe Audio", "Transcribe File" , "Transcribe YouTube"])
+demo.launch(share=True)