Alvin-Nahabwe committed on
Commit
a355d31
·
1 Parent(s): a5e00c1

Added configuration files

Browse files
Files changed (4) hide show
  1. README.md +8 -2
  2. app.py +30 -0
  3. packages.txt +14 -0
  4. requirements.txt +8 -0
README.md CHANGED
@@ -8,6 +8,12 @@ sdk_version: 4.42.0
8
  app_file: app.py
9
  pinned: false
10
  license: cc-by-nc-sa-4.0
 
 
 
 
 
 
 
 
11
  ---
12
-
13
- Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
 
8
  app_file: app.py
9
  pinned: false
10
  license: cc-by-nc-sa-4.0
11
+ models:
12
+ - asr-africa/wav2vec2-xls-r-1b-naijavoices-hausa-500hr-v0
13
+ - asr-africa/wav2vec2-xls-r-1b-naijavoices-igbo-500hr-v0
14
+ - asr-africa/wav2vec2-xls-r-1b-naijavoices-yoruba-500hr-v0
15
+ datasets:
16
+ - mozilla-foundation/common_voice_17_0
17
+ - naijavoices/naijavoices-dataset
18
+ - google/fleurs
19
  ---
 
 
app.py ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ from transformers import pipeline, Wav2Vec2ProcessorWithLM
3
+
4
# Pipelines that have already been built, keyed by model id. Building one
# means loading the LM-backed processor and the acoustic model, so it is done
# once per model id and reused by later requests.
_ASR_PIPELINES = {}


def _get_asr_pipeline(model_id):
    """Return the speech-recognition pipeline for ``model_id``, building it on first use."""
    asr = _ASR_PIPELINES.get(model_id)
    if asr is None:
        # The processor (tokenizer, feature extractor and LM decoder) is read
        # from the "lm" revision of the model repository.
        processor = Wav2Vec2ProcessorWithLM.from_pretrained(model_id, revision="lm")
        asr = pipeline(
            "automatic-speech-recognition",
            model=model_id,
            tokenizer=processor.tokenizer,
            feature_extractor=processor.feature_extractor,
            decoder=processor.decoder,
        )
        _ASR_PIPELINES[model_id] = asr
    return asr


def transcribe(audio, model_id):
    """Transcribe an audio clip with the selected model.

    Args:
        audio: The clip to transcribe, passed straight to the pipeline.
            The Gradio audio input in this file is configured to supply a
            file path; ``None`` means no clip was provided.
        model_id: Hub id of the checkpoint to use for recognition.

    Returns:
        The ``"text"`` field of the pipeline output.

    Raises:
        gr.Error: If ``audio`` or ``model_id`` is missing, so the user gets a
            readable message instead of a library traceback.
    """
    if audio is None:
        raise gr.Error("Please upload or record an audio clip first.")
    if not model_id:
        raise gr.Error("Please select a model first.")

    asr = _get_asr_pipeline(model_id)
    return asr(audio)["text"]
12
+
13
# Checkpoints offered in the model selector.
MODEL_IDS = [
    "asr-africa/wav2vec2-xls-r-1b-naijavoices-hausa-500hr-v0",
    "asr-africa/wav2vec2-xls-r-1b-naijavoices-igbo-500hr-v0",
    "asr-africa/wav2vec2-xls-r-1b-naijavoices-yoruba-500hr-v0",
]

# Web UI: an audio input (upload or microphone, handed over as a file path)
# plus a model selector, wired to `transcribe`, with plain-text output.
asr_app = gr.Interface(
    fn=transcribe,
    inputs=[
        gr.Audio(sources=["upload", "microphone"], type="filepath"),
        # Start with the first checkpoint selected so the callback is not
        # invoked with an empty model id when the user submits straight away.
        gr.Dropdown(choices=MODEL_IDS, value=MODEL_IDS[0], label="Model"),
    ],
    outputs="text",
    title="NaijaVoices ASR",
    description="Realtime demo for Hausa, Igbo and Yoruba speech recognition using a fine-tuned Wav2Vec-XLS-R 1B model.",
)

asr_app.launch()
packages.txt ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ libavcodec-extra
2
+ sox
3
+ libsndfile1
4
+ build-essential
5
+ libboost-system-dev
6
+ libboost-thread-dev
7
+ libboost-program-options-dev
8
+ libboost-test-dev
9
+ libeigen3-dev
10
+ zlib1g-dev
11
+ libbz2-dev
12
+ liblzma-dev
13
+ git-lfs
14
+ tree
requirements.txt ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ transformers
2
+ torch
3
+ torchaudio
4
+ accelerate
5
+ soundfile
6
+ librosa
7
+ pyctcdecode
8
+ https://github.com/kpu/kenlm/archive/master.zip