Spaces:

camparchimedes
/

nb

Build error

camparchimedes committed on Aug 25, 2024

Commit

1376856

verified ·

1 Parent(s): bdf9513

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -54,7 +54,7 @@ SIDEBAR_INFO = f"""
     <img src="{LOGO}" style="width: 100%; height: auto;"/>
 </div>
 """
-device = 0 if torch.cuda.is_available() else -1
 def convert_to_wav(filepath):
     _,file_ending = os.path.splitext(f'{filepath}')
@@ -62,12 +62,12 @@ def convert_to_wav(filepath):
     os.system(f'ffmpeg -i "{filepath}" -ar 16000 -ac 1 -c:a pcm_s16le "{audio_file}"')
     return audio_file
-pipe = pipeline("automatic-speech-recognition", model="NbAiLab/nb-whisper-large", device=device)
-def transcribe_audio(audio_file):
     start_time = time.time()
-    outputs = pipe(audio_file, return_timestamps=False, generate_kwargs={'task': 'transcribe', 'language': 'no'}) # skip_special_tokens=True
     text = outputs["text"]
     end_time = time.time()

     <img src="{LOGO}" style="width: 100%; height: auto;"/>
 </div>
 """
+device = "cuda" if torch.cuda.is_available() else "cpu"
 def convert_to_wav(filepath):
     _,file_ending = os.path.splitext(f'{filepath}')
     os.system(f'ffmpeg -i "{filepath}" -ar 16000 -ac 1 -c:a pcm_s16le "{audio_file}"')
     return audio_file
+pipe = pipeline("automatic-speech-recognition", model="NbAiLab/nb-whisper-large", chunk_length_s=30, device=device)
+def transcribe_audio(audio_file, batch_size=16):
     start_time = time.time()
+    outputs = pipe(audio_file, batch_size=batch_size, return_timestamps=False, generate_kwargs={'task': 'transcribe', 'language': 'no'}) # skip_special_tokens=True
     text = outputs["text"]
     end_time = time.time()