Futuresony committed on
Commit
e758b0c
·
verified ·
1 Parent(s): 8788e6c

Update asr.py

Browse files
Files changed (1) hide show
  1. asr.py +6 -5
asr.py CHANGED
@@ -4,11 +4,11 @@ import numpy as np
4
  import langid # Language detection library
5
  from transformers import Wav2Vec2ForCTC, AutoProcessor
6
 
7
- #ASR_SAMPLING_RATE = 16_000
8
- #MODEL_ID = "facebook/mms-1b-all"
9
- # openai/whisper-large-v3-turbo
10
  ASR_SAMPLING_RATE = 16_000
11
- MODEL_ID = "openai/whisper-large-v3-turbo"
 
 
 
12
 
13
  # Load MMS Model
14
  processor = AutoProcessor.from_pretrained(MODEL_ID)
@@ -59,4 +59,5 @@ def transcribe_auto(audio_data=None):
59
  ids = torch.argmax(outputs, dim=-1)[0]
60
  final_transcription = processor.decode(ids)
61
 
62
- return f"Detected Language: {detected_lang.upper()}\n\nTranscription:\n{final_transcription}"
 
 
4
  import langid # Language detection library
5
  from transformers import Wav2Vec2ForCTC, AutoProcessor
6
 
 
 
 
7
  ASR_SAMPLING_RATE = 16_000
8
+ MODEL_ID = "facebook/mms-1b-all"
9
+ # openai/whisper-large-v3-turbo
10
+ #ASR_SAMPLING_RATE = 16_000
11
+ #MODEL_ID = "openai/whisper-large-v3-turbo"
12
 
13
  # Load MMS Model
14
  processor = AutoProcessor.from_pretrained(MODEL_ID)
 
59
  ids = torch.argmax(outputs, dim=-1)[0]
60
  final_transcription = processor.decode(ids)
61
 
62
+ # return f"Detected Language: {detected_lang.upper()}\n\nTranscription:\n{final_transcription}"
63
+ return f"{final_transcription}"