Spaces:

badrex
/

ASRwanda

Running on Zero

App Files Files Community

badrex committed on Jun 30

Commit

fda6e40

verified ·

1 Parent(s): 9d34c9e

Update app.py

Browse files

Files changed (1) hide show

app.py +70 -0

app.py CHANGED Viewed

	@@ -0,0 +1,70 @@

+import gradio as gr
+from transformers import pipeline
+import numpy as np
+import os
+from huggingface_hub import login
+import spaces
+HF_TOKEN = os.environ.get("HF_TOKEN")
+if HF_TOKEN:
+    login(token=HF_TOKEN)
+MODEL_ID = "badrex/ASRwanda"
+transcriber = pipeline("automatic-speech-recognition", model=MODEL_ID)
+@spaces.GPU
+def transcribe(audio):
+    sr, y = audio
+    # convert to mono if stereo
+    if y.ndim > 1:
+        y = y.mean(axis=1)
+    y = y.astype(np.float32)
+    y /= np.max(np.abs(y))
+    return transcriber({"sampling_rate": sr, "raw": y})["text"]
+examples = []
+examples_dir = "examples"
+if os.path.exists(examples_dir):
+    for filename in os.listdir(examples_dir):
+        if filename.endswith((".wav", ".mp3", ".ogg")):
+            examples.append([os.path.join(examples_dir, filename)])
+    print(f"Found {len(examples)} example files")
+else:
+    print("Examples directory not found")
+demo = gr.Interface(
+    fn=transcribe,
+    inputs=gr.Audio(),
+    outputs="text",
+    title="<div>ASRwanda 🎙️ <br>Speech Recognition for Kinyarwanda</div>",
+    description="""
+        <div class="centered-content">
+            <div>
+                <p>
+                Developed with ❤ by <a href="https://badrex.github.io/" style="color: #2563eb;">Badr al-Absi</a>
+                </p>
+                <br>
+                <p style="font-size: 15px; line-height: 1.8;">
+                 Muraho 👋🏼
+                <br>
+                <br>
+                 This is a demo for ASRwanda, a Transformer-based automatic speech recognition (ASR) system for Kinyarwanda language.
+                 The underlying ASR model was trained on 500 hours of transcribed speech provided by
+                 <https://digitalumuganda.com/" style="color: #2563eb;">Digital Umuganda</a> as part of the Kin-ASR-2025 challenge.
+                <br>
+                <p style="font-size: 15px; line-height: 1.8;">
+                Simply <strong>upload an audio file</strong> 📤 or <strong>record yourself speaking</strong> 🎙️⏺️ to try out the model!
+                </p>
+            </div>
+        </div>
+        """,
+    examples=examples if examples else None,
+    cache_examples=False,
+    flagging_mode=None,
+)
+if __name__ == "__main__":
+    demo.launch()