Spaces:

jlvdoorn
/

WhisperATC

Running

jlvdoorn committed on Aug 30, 2023

Commit

083757a

•

1 Parent(s): be31eba

Changed to a single input (audio file)

Files changed (1) hide show

app.py CHANGED Viewed

@@ -9,11 +9,9 @@ whisper = pipeline(model='jlvdoorn/whisper-large-v2-atco2-asr-atcosim', use_auth
 # bert_atco_ner = pipeline(model='Jzuluaga/bert-base-ner-atc-en-atco2-1h')
 #%%
-def transcribe(audio_mic, audio_file):
     if audio_file is not None:
         return whisper(audio_file)['text']
-    if audio_mic is not None:
-        return whisper(audio_mic)['text']
     else:
         return 'There was no audio to transcribe...'
@@ -48,7 +46,7 @@ def transcribe(audio_mic, audio_file):
 #%%
 iface = gr.Interface(
         fn=transcribe,
-        inputs=[gr.Audio(source='microphone', type='filepath'), gr.Audio(source='upload', type='filepath')],
         outputs=gr.Text(label='Transcription'),
         title='Whisper Large v2 - ATCO2-ASR-ATCOSIM',
         description='This demo will transcribe ATC audio files by using the Whisper Large v2 model fine-tuned on the ATCO2 and ATCOSIM datasets. Further it uses a Named Entity Recognition model to extract callsigns, commands and values from the transcription. This model is based on Google\'s BERT model and fine-tuned on the ATCO2 dataset.',

 # bert_atco_ner = pipeline(model='Jzuluaga/bert-base-ner-atc-en-atco2-1h')
 #%%
+def transcribe(audio_file):
     if audio_file is not None:
         return whisper(audio_file)['text']
     else:
         return 'There was no audio to transcribe...'
 #%%
 iface = gr.Interface(
         fn=transcribe,
+        inputs=gr.Audio(source='upload', type='filepath'),
         outputs=gr.Text(label='Transcription'),
         title='Whisper Large v2 - ATCO2-ASR-ATCOSIM',
         description='This demo will transcribe ATC audio files by using the Whisper Large v2 model fine-tuned on the ATCO2 and ATCOSIM datasets. Further it uses a Named Entity Recognition model to extract callsigns, commands and values from the transcription. This model is based on Google\'s BERT model and fine-tuned on the ATCO2 dataset.',