Spaces:
Sleeping
Sleeping
Upload app.py
Browse files
app.py
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
import gradio as gr
|
2 |
-
from transformers import pipeline,
|
3 |
import os
|
4 |
|
5 |
def transcribe(audio, language):
|
@@ -24,15 +24,10 @@ def transcribe(audio, language):
|
|
24 |
"bambara": "asr-africa/mms-bambara-50-hours-mixed-bambara-dataset",
|
25 |
}
|
26 |
|
27 |
-
if language in ["hausa", "igbo", "yoruba"]:
|
28 |
-
revision = "lm"
|
29 |
-
else:
|
30 |
-
revision = "main"
|
31 |
-
|
32 |
# load processor
|
33 |
-
p =
|
34 |
# load eval pipeline
|
35 |
-
asr = pipeline("automatic-speech-recognition", model=model_map[language], tokenizer=p.tokenizer, feature_extractor=p.feature_extractor, decoder=p.decoder, token=os.getenv('HF_TOKEN')
|
36 |
|
37 |
text = asr(audio)["text"]
|
38 |
return text
|
|
|
1 |
import gradio as gr
|
2 |
+
from transformers import pipeline, AutoProcessor
|
3 |
import os
|
4 |
|
5 |
def transcribe(audio, language):
|
|
|
24 |
"bambara": "asr-africa/mms-bambara-50-hours-mixed-bambara-dataset",
|
25 |
}
|
26 |
|
|
|
|
|
|
|
|
|
|
|
27 |
# load processor
|
28 |
+
p = AutoProcessor.from_pretrained(model_map[language])
|
29 |
# load eval pipeline
|
30 |
+
asr = pipeline("automatic-speech-recognition", model=model_map[language], tokenizer=p.tokenizer, feature_extractor=p.feature_extractor, decoder=p.decoder, device=0, token=os.getenv('HF_TOKEN'))
|
31 |
|
32 |
text = asr(audio)["text"]
|
33 |
return text
|