Spaces:

Futuresony
/

Swahili-speech-recognition

Sleeping

Futuresony committed on Feb 24

Commit

af87fba

verified ·

1 Parent(s): b3a902e

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -3,7 +3,7 @@ import torch
 import torchaudio
 from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
-# Load your model from Hugging Face
 model_name = "Futuresony/Future-sw_ASR-24-02-2025"
 processor = Wav2Vec2Processor.from_pretrained(model_name)
 model = Wav2Vec2ForCTC.from_pretrained(model_name)
@@ -29,9 +29,9 @@ def transcribe_live(microphone_audio):
 # Create Gradio interface with live microphone input
 interface = gr.Interface(
     fn=transcribe_live,
-    inputs=gr.Audio(source="microphone", type="filepath"),
     outputs="text",
-    live=True,  # Enables real-time updates
     title="Live Swahili ASR Transcription",
     description="Speak into your microphone, and the model will transcribe in real-time.",
 )
@@ -39,4 +39,3 @@ interface = gr.Interface(
 # Launch the app
 if __name__ == "__main__":
     interface.launch()

 import torchaudio
 from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
+# Load the Swahili ASR model
 model_name = "Futuresony/Future-sw_ASR-24-02-2025"
 processor = Wav2Vec2Processor.from_pretrained(model_name)
 model = Wav2Vec2ForCTC.from_pretrained(model_name)
 # Create Gradio interface with live microphone input
 interface = gr.Interface(
     fn=transcribe_live,
+    inputs=gr.Audio(sources=["microphone"], type="filepath"),
     outputs="text",
+    live=True,
     title="Live Swahili ASR Transcription",
     description="Speak into your microphone, and the model will transcribe in real-time.",
 )
 # Launch the app
 if __name__ == "__main__":
     interface.launch()