camparchimedes committed
Commit 5dae7d4 · verified · 1 Parent(s): 1622cb0

Update app.py

Files changed (1): app.py (+19 −2)
app.py CHANGED
@@ -54,9 +54,9 @@ device = torch.device('cuda')
 #device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
 
 #@spaces.GPU
-def transcribe(microphone, file_upload, progress=gr.Progress(track_tqdm=True)):
+def transcribe(file_upload, progress=gr.Progress(track_tqdm=True)):  # microphone
 
-    file = microphone if microphone is not None else file_upload
+    file = file_upload  # microphone if microphone is not None else
     start_time = time.time()
 
     #--------------____________________________________________--------------"
@@ -67,6 +67,23 @@ def transcribe(microphone, file_upload, progress=gr.Progress(track_tqdm=True)):
 
     with torch.no_grad():
         pipe = pipeline("automatic-speech-recognition", model="NbAiLab/nb-whisper-large", device=device)
+
+    """
+    # -- chunking
+    chunks = chunk_audio(file, chunk_length_ms=30000, overlap_length_ms=5000)
+
+    full_transcription = []
+    for chunk in chunks:
+        # -- convert chunk to temporary file-like object
+        temp_audio = chunk.export(format="wav")
+
+        # -- transcribe chunk
+        text = pipe(temp_audio)["text"]
+        full_transcription.append(text)
+
+    # -- join chunk transcriptions
+    full_text = " ".join(full_transcription)
+    """
 
 
     text = pipe(file)["text"]
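
Note: the commented-out block added in this commit calls a chunk_audio helper that is not defined anywhere in the diff. Below is a minimal sketch of what such a helper could look like, assuming pydub (whose millisecond-based slicing and chunk.export(format="wav") match how the chunks are used above); the name and parameters simply mirror the call in the commit, and the implementation is an illustration, not the author's code.

from pydub import AudioSegment  # assumption: pydub supplies the chunk objects used in the block above

def chunk_audio(path, chunk_length_ms=30000, overlap_length_ms=5000):
    # Load the audio file and split it into overlapping windows.
    # pydub AudioSegment slices are indexed in milliseconds.
    audio = AudioSegment.from_file(path)
    step = chunk_length_ms - overlap_length_ms
    # The final chunk may be shorter than chunk_length_ms.
    return [audio[start:start + chunk_length_ms] for start in range(0, len(audio), step)]

If the block were ever enabled, full_text (rather than the later text = pipe(file)["text"]) would be the transcription to return. The transformers ASR pipeline can also chunk long inputs itself via its chunk_length_s and stride_length_s arguments, which would avoid the manual loop entirely.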