srinivasbilla committed on
Commit
9a83786
·
verified ·
1 Parent(s): dbff21d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -1
app.py CHANGED
@@ -2,7 +2,6 @@ from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
2
  import torch
3
  import soundfile as sf
4
  from xcodec2.modeling_xcodec2 import XCodec2Model
5
- from IPython import display
6
  import torchaudio
7
  import spaces
8
  import gradio as gr
@@ -59,6 +58,9 @@ def infer(sample_audio_path, target_text):
59
  with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as f:
60
 
61
  waveform, sample_rate = torchaudio.load(sample_audio_path)
 
 
 
62
 
63
  # Check if the audio is stereo (i.e., has more than one channel)
64
  if waveform.size(0) > 1:
 
2
  import torch
3
  import soundfile as sf
4
  from xcodec2.modeling_xcodec2 import XCodec2Model
 
5
  import torchaudio
6
  import spaces
7
  import gradio as gr
 
58
  with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as f:
59
 
60
  waveform, sample_rate = torchaudio.load(sample_audio_path)
61
+ if len(waveform[0])/sample_rate > 15:
62
+ gr.Warning("Trimming audio to first 15secs.")
63
+ waveform = waveform[:, :sample_rate*15]
64
 
65
  # Check if the audio is stereo (i.e., has more than one channel)
66
  if waveform.size(0) > 1: