Spaces:

camparchimedes
/

nb

Build error

camparchimedes committed on Aug 26, 2024

Commit

9e87cc4

verified ·

1 Parent(s): ebe1913

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -55,7 +55,7 @@ SIDEBAR_INFO = f"""
 </div>
 """
-#              ------------transcribe section------------
 @spaces.GPU()
 def convert_to_wav(filepath):
@@ -64,13 +64,20 @@ def convert_to_wav(filepath):
     os.system(f'ffmpeg -i "{filepath}" -ar 16000 -ac 1 -c:a pcm_s16le "{audio_file}"')
     return audio_file
-pipe = pipeline("automatic-speech-recognition", model="NbAiLab/nb-whisper-large", chunk_length_s=30)
 @spaces.GPU()
 def transcribe_audio(audio_file, batch_size=16):
     start_time = time.time()
-    outputs = pipe(audio_file, batch_size=batch_size, return_timestamps=False)
     end_time = time.time()
@@ -97,6 +104,7 @@ def transcribe_audio(audio_file, batch_size=16):
     return text.strip(), system_info
 #              ------------summary section------------

 </div>
 """
+# ------------transcribe section------------
 @spaces.GPU()
 def convert_to_wav(filepath):
     os.system(f'ffmpeg -i "{filepath}" -ar 16000 -ac 1 -c:a pcm_s16le "{audio_file}"')
     return audio_file
+pipe = pipeline("automatic-speech-recognition", model="NbAiLab/nb-whisper-large", chunk_length_s=30, generate_kwargs={'task': 'transcribe', 'language': 'no'})
 @spaces.GPU()
 def transcribe_audio(audio_file, batch_size=16):
+    # Load the audio file into a numpy array
+    audio = AudioSegment.from_wav(audio_file)
+    samples = np.array(audio.get_array_of_samples())
+    sample_rate = audio.frame_rate
     start_time = time.time()
+    # Transcribe the audio file
+    outputs = pipe(samples, sampling_rate=sample_rate, batch_size=batch_size, return_timestamps=False)
+    text = outputs["text"]
     end_time = time.time()
     return text.strip(), system_info
 #              ------------summary section------------