aar2dee2 committed on
Commit
3e9b592
·
1 Parent(s): 12940e9

return numpy output of audio

Browse files
Files changed (1) hide show
  1. app.py +3 -8
app.py CHANGED
@@ -7,7 +7,6 @@ from vocode import getenv
7
  import gradio as gr
8
  import os
9
  import logging
10
- import sounddevice as sd
11
  from vocode.turn_based.agent.chat_gpt_agent import ChatGPTAgent
12
  from vocode.turn_based.synthesizer import CoquiSynthesizer
13
  from vocode.turn_based.transcriber.whisper_transcriber import WhisperTranscriber
@@ -88,16 +87,12 @@ def convert_to_audio_segment(input_audio):
88
  def send_audio(audio_segment: AudioSegment):
89
  logger.info("now processing output")
90
  sampling_rate = DEFAULT_SAMPLING_RATE
91
- stream = sd.OutputStream(
92
- channels=1,
93
- samplerate=sampling_rate,
94
- dtype=np.int16,
95
- device=None,
96
- )
97
  raw_data = audio_segment.raw_data
98
  if audio_segment.frame_rate != sampling_rate:
99
  raw_data = audio_segment.set_frame_rate(sampling_rate).raw_data
100
- return stream.write(np.frombuffer(raw_data, dtype=np.int16))
 
 
101
 
102
 
103
  def main(input_audio):
 
7
  import gradio as gr
8
  import os
9
  import logging
 
10
  from vocode.turn_based.agent.chat_gpt_agent import ChatGPTAgent
11
  from vocode.turn_based.synthesizer import CoquiSynthesizer
12
  from vocode.turn_based.transcriber.whisper_transcriber import WhisperTranscriber
 
87
  def send_audio(audio_segment: AudioSegment):
88
  logger.info("now processing output")
89
  sampling_rate = DEFAULT_SAMPLING_RATE
 
 
 
 
 
 
90
  raw_data = audio_segment.raw_data
91
  if audio_segment.frame_rate != sampling_rate:
92
  raw_data = audio_segment.set_frame_rate(sampling_rate).raw_data
93
+ output = np.frombuffer(raw_data, dtype=np.int16)
94
+
95
+ return output
96
 
97
 
98
  def main(input_audio):