Spaces:

Aekanun
/

ThaiSpeech-to-Text-v1.0

Running on Zero

Aekanun committed on Dec 1, 2024

Commit

25d528b

1 Parent(s): 24fa852

rev app

Files changed (1) hide show

app.py CHANGED Viewed

@@ -8,7 +8,7 @@ model = pipeline(
     "automatic-speech-recognition",
     model="Aekanun/whisper-small-hi",
     device="cpu",
-    torch_dtype=torch.float16  # กำหนด data type เป็น float16
 )
 @spaces.GPU
@@ -19,11 +19,15 @@ def transcribe_speech(audio):
             return "กรุณาบันทึกเสียงก่อน"
         # Move model to GPU with float16
-        model.model = model.model.to("cuda").half()  # ใช้ .half() เพื่อแปลงเป็น float16
         with torch.amp.autocast('cuda'):
-            # Process audio
-            result = model(audio, batch_size=1)
             # Get text result
             text = result["text"] if isinstance(result, dict) else result

     "automatic-speech-recognition",
     model="Aekanun/whisper-small-hi",
     device="cpu",
+    torch_dtype=torch.float16
 )
 @spaces.GPU
             return "กรุณาบันทึกเสียงก่อน"
         # Move model to GPU with float16
+        model.model = model.model.to("cuda").half()
         with torch.amp.autocast('cuda'):
+            # Process audio with chunk_length_s
+            result = model(
+                audio,
+                batch_size=1,
+                chunk_length_s=30  # แบ่งเสียงเป็นช่วงละ 30 วินาที
+            )
             # Get text result
             text = result["text"] if isinstance(result, dict) else result