Spaces:

badrex
/

arabic-dialect-identifier-demo

Running

App Files Community

badrex committed 5 days ago

Commit

23545c8

1 Parent(s): dbaaa4a

add examples and update requirements.txt

Browse files

Files changed (34) hide show

app.py +59 -30
examples/07sQYGJjXp.mp3 +0 -0
examples/0Dx4G69NT1.mp3 +0 -0
examples/0EklRxI2r7.mp3 +0 -0
examples/0lhKyMVanh.mp3 +0 -0
examples/3EeaoDRPEd.mp3 +0 -0
examples/3Fi3cisTLe.mp3 +0 -0
examples/3bEPdiqxC7.mp3 +0 -0
examples/3zRKfpKl0Y.mp3 +0 -0
examples/56S1DlxtmW.mp3 +0 -0
examples/5jehSBK6Pg.mp3 +0 -0
examples/5q7nveNeiy.mp3 +0 -0
examples/67ub2dQVtY.mp3 +0 -0
examples/68jlcwwZNQ.mp3 +0 -0
examples/6D3IzKfPsg.mp3 +0 -0
examples/6fDC05Y789.mp3 +0 -0
examples/6tClWfytMf.mp3 +0 -0
examples/7hJUpVTD91.mp3 +0 -0
examples/9XiCrJdINc.mp3 +0 -0
examples/AICriJDIrA.mp3 +0 -0
examples/AT2Oo9AjZw.mp3 +0 -0
examples/BPyRgUKYav.mp3 +0 -0
examples/CbrP4lagnL.mp3 +0 -0
examples/CmBBDRsOVU.mp3 +0 -0
examples/FFAKzxhVgC.mp3 +0 -0
examples/Lionel-Messi_(arywiki)-2.mp3 +0 -0
examples/PDJbpexQFE.mp3 +0 -0
examples/bsBqTDHUgx.mp3 +0 -0
examples/bywrMXKv1a.mp3 +0 -0
examples/cLOEsibJJW.mp3 +0 -0
examples/fDyks4ZZsU.mp3 +0 -0
examples/gksGGsLoAq.mp3 +0 -0
examples/obud3p5tvb.mp3 +0 -0
requirements.txt +3 -2

app.py CHANGED Viewed

@@ -1,12 +1,18 @@
 import gradio as gr
 from transformers import pipeline
 import numpy as np
 # Load the model
-model_id = "badrex/mms-300m-arabic-dialect-identifier"  # Replace with your model ID
-classifier = pipeline("audio-classification", model=model_id)
-# Define dialect names for better display
 dialect_mapping = {
     "MSA": "Modern Standard Arabic",
     "Egyptian": "Egyptian Arabic",
@@ -16,43 +22,66 @@ dialect_mapping = {
 }
 def predict_dialect(audio):
-    # The audio input from Gradio is a tuple of (sample_rate, audio_array)
-    if isinstance(audio, tuple) and len(audio) == 2:
         sr, audio_array = audio
-    else:
-        # Handle error case
         return {"Error": 1.0}
-    # Process the audio input
-    if len(audio_array.shape) > 1:
-        audio_array = audio_array.mean(axis=1)  # Convert stereo to mono
-    # Classify the dialect
-    predictions = classifier({"sampling_rate": sr, "raw": audio_array})
-    # Format results for display
-    results = {}
-    for pred in predictions:
-        dialect_name = dialect_mapping.get(pred['label'], pred['label'])
-        results[dialect_name] = float(pred['score'])
-    return results
 # Create the Gradio interface
 demo = gr.Interface(
     fn=predict_dialect,
-    inputs=gr.Audio(),  # Simplified audio input
     outputs=gr.Label(num_top_classes=5, label="Predicted Dialect"),
     title="Arabic Dialect Identifier",
     description="""This demo identifies Arabic dialects from speech audio.
     Upload an audio file or record your voice speaking Arabic to see which dialect it matches.
     The model identifies: Modern Standard Arabic (MSA), Egyptian, Gulf, Levantine, and Maghrebi dialects.""",
-    examples=[
-        # Optional: Add example audio files here if you have them
-        # ["examples/msa_example.wav"],
-        # ["examples/egyptian_example.wav"],
-    ],
-    allow_flagging="never"
 )
 # Launch the app

 import gradio as gr
 from transformers import pipeline
 import numpy as np
+import os
 # Load the model
+# Load the audio-classification pipeline once at import time so every
+# request reuses the same model instance.
+print("Loading model...")
+model_id = "badrex/mms-300m-arabic-dialect-identifier"
+try:
+    classifier = pipeline("audio-classification", model=model_id)
+    print("Model loaded successfully")
+except Exception as e:
+    # NOTE(review): the failure is only printed; `classifier` is left
+    # undefined in that case, so later uses of it will raise NameError.
+    print(f"Error loading model: {e}")
+# Define dialect mapping
 dialect_mapping = {
     "MSA": "Modern Standard Arabic",
     "Egyptian": "Egyptian Arabic",
 }
 def predict_dialect(audio):
+    """Classify the Arabic dialect spoken in a Gradio audio input.
+
+    Args:
+        audio: A ``(sample_rate, samples)`` tuple, or ``None`` when no
+            audio was provided.
+
+    Returns:
+        A dict mapping each dialect display name to its score, or
+        ``{"Error": 1.0}`` when there is no usable audio or the
+        prediction fails.
+    """
+    try:
+        if audio is None:
+            return {"Error": 1.0}
         sr, audio_array = audio
+        # Convert to float32 up front: integer PCM samples (presumably what
+        # Gradio delivers for numpy audio -- confirm) cannot be resampled by
+        # the pipeline, which needs floating-point input.
+        audio_array = np.asarray(audio_array, dtype=np.float32)
+        if audio_array.ndim > 1:
+            audio_array = audio_array.mean(axis=1)  # Convert stereo to mono
+        if audio_array.size == 0:
+            return {"Error": 1.0}
+        # Scale to [-1, 1]; skip all-zero (silent) input to avoid dividing by 0.
+        peak = float(np.max(np.abs(audio_array)))
+        if peak > 0:
+            audio_array = audio_array / peak
+        print(f"Processing audio: sample rate={sr}, shape={audio_array.shape}")
+        # Classify the dialect
+        predictions = classifier({"sampling_rate": sr, "raw": audio_array})
+        # Format results for display, falling back to the raw label when it
+        # has no entry in dialect_mapping.
+        results = {
+            dialect_mapping.get(pred['label'], pred['label']): float(pred['score'])
+            for pred in predictions
+        }
+        return results
+    except Exception as e:
+        # Boundary handler for the UI callback: log and show a generic error.
+        print(f"Error in prediction: {e}")
         return {"Error": 1.0}
+# Find example files
+example_files = []
+examples_dir = "examples"
+if os.path.isdir(examples_dir):
+    # os.listdir returns entries in arbitrary order; sort so the examples
+    # are listed in the same order on every start.
+    example_files = [
+        os.path.join(examples_dir, filename)
+        for filename in sorted(os.listdir(examples_dir))
+        if filename.endswith((".wav", ".mp3", ".ogg"))
+    ]
+    print(f"Found {len(example_files)} example files")
+else:
+    print("Examples directory not found")
+# Examples with labels
+# Each row is [audio path, "<label> Sample"]. The label comes from the part
+# of the file name before the first "_" (or before the first "." when there
+# is no "_"), mapped through dialect_mapping when it is a known key.
+examples = []
+for file in example_files:
+    basename = os.path.basename(file)
+    dialect = basename.split("_")[0] if "_" in basename else basename.split(".")[0]
+    label = dialect_mapping.get(dialect, dialect.capitalize())
+    examples.append([file, f"{label} Sample"])
 # Create the Gradio interface
+# One audio input is passed to predict_dialect and the returned scores are
+# shown as a label with the top five classes.
 demo = gr.Interface(
     fn=predict_dialect,
+    inputs=gr.Audio(),
     outputs=gr.Label(num_top_classes=5, label="Predicted Dialect"),
     title="Arabic Dialect Identifier",
     description="""This demo identifies Arabic dialects from speech audio.
     Upload an audio file or record your voice speaking Arabic to see which dialect it matches.
     The model identifies: Modern Standard Arabic (MSA), Egyptian, Gulf, Levantine, and Maghrebi dialects.""",
+    examples=examples if examples else None,
+    examples_per_page=5,
+    # Keep flagging disabled, as the previous allow_flagging="never" did;
+    # passing None would fall back to Gradio's default flagging mode.
+    flagging_mode="never",
 )
 # Launch the app

examples/07sQYGJjXp.mp3 ADDED Viewed

Binary file (19.7 kB). View file

examples/0Dx4G69NT1.mp3 ADDED Viewed

Binary file (56.1 kB). View file

examples/0EklRxI2r7.mp3 ADDED Viewed

Binary file (25.1 kB). View file

examples/0lhKyMVanh.mp3 ADDED Viewed

Binary file (27.7 kB). View file

examples/3EeaoDRPEd.mp3 ADDED Viewed

Binary file (36.9 kB). View file

examples/3Fi3cisTLe.mp3 ADDED Viewed

Binary file (45.2 kB). View file

examples/3bEPdiqxC7.mp3 ADDED Viewed

Binary file (39.7 kB). View file

examples/3zRKfpKl0Y.mp3 ADDED Viewed

Binary file (43.5 kB). View file

examples/56S1DlxtmW.mp3 ADDED Viewed

Binary file (48.3 kB). View file

examples/5jehSBK6Pg.mp3 ADDED Viewed

Binary file (26.5 kB). View file

examples/5q7nveNeiy.mp3 ADDED Viewed

Binary file (69.6 kB). View file

examples/67ub2dQVtY.mp3 ADDED Viewed

Binary file (27.2 kB). View file

examples/68jlcwwZNQ.mp3 ADDED Viewed

Binary file (92.8 kB). View file

examples/6D3IzKfPsg.mp3 ADDED Viewed

Binary file (33.4 kB). View file

examples/6fDC05Y789.mp3 ADDED Viewed

Binary file (35.2 kB). View file

examples/6tClWfytMf.mp3 ADDED Viewed

Binary file (54.5 kB). View file

examples/7hJUpVTD91.mp3 ADDED Viewed

Binary file (25 kB). View file

examples/9XiCrJdINc.mp3 ADDED Viewed

Binary file (53.3 kB). View file

examples/AICriJDIrA.mp3 ADDED Viewed

Binary file (59.2 kB). View file

examples/AT2Oo9AjZw.mp3 ADDED Viewed

Binary file (42.6 kB). View file

examples/BPyRgUKYav.mp3 ADDED Viewed

Binary file (38.5 kB). View file

examples/CbrP4lagnL.mp3 ADDED Viewed

Binary file (51.2 kB). View file

examples/CmBBDRsOVU.mp3 ADDED Viewed

Binary file (59.9 kB). View file

examples/FFAKzxhVgC.mp3 ADDED Viewed

Binary file (40.6 kB). View file

examples/Lionel-Messi_(arywiki)-2.mp3 ADDED Viewed

Binary file (94.5 kB). View file

examples/PDJbpexQFE.mp3 ADDED Viewed

Binary file (44.3 kB). View file

examples/bsBqTDHUgx.mp3 ADDED Viewed

Binary file (50 kB). View file

examples/bywrMXKv1a.mp3 ADDED Viewed

Binary file (94.4 kB). View file

examples/cLOEsibJJW.mp3 ADDED Viewed

Binary file (99.1 kB). View file

examples/fDyks4ZZsU.mp3 ADDED Viewed

Binary file (19.5 kB). View file

examples/gksGGsLoAq.mp3 ADDED Viewed

Binary file (290 kB). View file

examples/obud3p5tvb.mp3 ADDED Viewed

Binary file (31.6 kB). View file

requirements.txt CHANGED Viewed

@@ -1,4 +1,5 @@
-gradio>=3.50.2
 transformers>=4.36.0
 torch>=2.0.0
-librosa>=0.10.1

+gradio>=5.20.0
 transformers>=4.36.0
 torch>=2.0.0
+torchaudio>=2.0.0
+librosa>=0.10.1