Alvin-Nahabwe committed on
Commit
87c3eaa
·
verified ·
1 Parent(s): d045f90

Upload app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -8
app.py CHANGED
@@ -1,5 +1,5 @@
1
  import gradio as gr
2
- from transformers import pipeline, Wav2Vec2ProcessorWithLM
3
  import os
4
 
5
  def transcribe(audio, language):
@@ -24,15 +24,10 @@ def transcribe(audio, language):
24
  "bambara": "asr-africa/mms-bambara-50-hours-mixed-bambara-dataset",
25
  }
26
 
27
- if language in ["hausa", "igbo", "yoruba"]:
28
- revision = "lm"
29
- else:
30
- revision = "main"
31
-
32
  # load processor
33
- p = Wav2Vec2ProcessorWithLM.from_pretrained(model_map[language], revision=revision)
34
  # load eval pipeline
35
- asr = pipeline("automatic-speech-recognition", model=model_map[language], tokenizer=p.tokenizer, feature_extractor=p.feature_extractor, decoder=p.decoder, token=os.getenv('HF_TOKEN'), device=0)
36
 
37
  text = asr(audio)["text"]
38
  return text
 
1
  import gradio as gr
2
+ from transformers import pipeline, AutoProcessor
3
  import os
4
 
5
  def transcribe(audio, language):
 
24
  "bambara": "asr-africa/mms-bambara-50-hours-mixed-bambara-dataset",
25
  }
26
 
 
 
 
 
 
27
  # load processor
28
+ p = AutoProcessor.from_pretrained(model_map[language])
29
  # load eval pipeline
30
+ asr = pipeline("automatic-speech-recognition", model=model_map[language], tokenizer=p.tokenizer, feature_extractor=p.feature_extractor, decoder=p.decoder, device=0, token=os.getenv('HF_TOKEN'))
31
 
32
  text = asr(audio)["text"]
33
  return text