camparchimedes committed on
Commit 9769005 · verified · 1 Parent(s): 01ca89f

Update app.py

Files changed (1)
  1. app.py +13 -6
app.py CHANGED
@@ -24,26 +24,33 @@ import torch
 from transformers import pipeline, AutoProcessor # AutoModelForSpeechSeq2Seq

 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+torch_dtype = torch.float32

-pipe = pipeline("automatic-speech-recognition", model="NbAiLabBeta/nb-whisper-large", device=device, torch_dtype=torch.float32)
+pipe = pipeline("automatic-speech-recognition", model="NbAiLabBeta/nb-whisper-large", device=device, torch_dtype=torch_dtype)

 # @spaces.GPU(queue=True)

-# Initialize processor before using it in the function
+# Initialize processor and pipeline
 processor = AutoProcessor.from_pretrained("NbAiLabBeta/nb-whisper-large")
+device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+torch_dtype = torch.float32

 language = "no"
 task = "transcribe"

-def transcribe_audio(audio_file, forced_decoder_ids):
+def transcribe_audio(audio_file):
     if audio_file.endswith(".m4a"):
         audio_file = convert_to_wav(audio_file)

     start_time = time.time()
-    forced_decoder_ids = processor.get_decoder_prompt_ids(language="no", task="transcribe")
+
+    # forced_decoder_ids@the correct context
+    forced_decoder_ids = processor.get_decoder_prompt_ids(language=language, task=task)

     with torch.no_grad():
-        output = pipe(audio_file, chunk_length_s=30, generate_kwargs={"forced_decoder_ids": forced_decoder_ids})
+        # CUDA@function -->
+        with torch.cuda.device(device) if torch.cuda.is_available() else contextlib.nullcontext():
+            output = pipe(audio_file, chunk_length_s=30, generate_kwargs={"forced_decoder_ids": forced_decoder_ids})

     text = output["text"]
     end_time = time.time()
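Pieced together, the new side of this hunk amounts to the following; a minimal, self-contained sketch of the updated flow, assuming `contextlib` and `time` are imported near the top of app.py (neither import is visible in the hunk) and that `convert_to_wav` is a helper defined elsewhere in the file. The return statement is not shown in the hunk and is added here only to make the sketch usable.

import time
import contextlib  # needed for contextlib.nullcontext() on CPU-only machines (assumed to be imported in app.py)

import torch
from transformers import pipeline, AutoProcessor

device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
torch_dtype = torch.float32

# ASR pipeline and processor for the Norwegian Whisper checkpoint
pipe = pipeline("automatic-speech-recognition", model="NbAiLabBeta/nb-whisper-large",
                device=device, torch_dtype=torch_dtype)
processor = AutoProcessor.from_pretrained("NbAiLabBeta/nb-whisper-large")

language = "no"
task = "transcribe"

def transcribe_audio(audio_file):
    # convert_to_wav() is defined elsewhere in app.py (not shown in this hunk)
    if audio_file.endswith(".m4a"):
        audio_file = convert_to_wav(audio_file)

    start_time = time.time()
    # The decoder prompt is now built inside the function instead of being passed in by the caller
    forced_decoder_ids = processor.get_decoder_prompt_ids(language=language, task=task)

    with torch.no_grad():
        # Run on the CUDA device when one is available, otherwise fall back to a no-op context
        with torch.cuda.device(device) if torch.cuda.is_available() else contextlib.nullcontext():
            output = pipe(audio_file, chunk_length_s=30,
                          generate_kwargs={"forced_decoder_ids": forced_decoder_ids})

    text = output["text"]
    end_time = time.time()
    return text, end_time - start_time  # return value not shown in the hunk; added for illustration

A caller would then use it as text, elapsed = transcribe_audio("meeting.m4a"), with the output pinned to Norwegian transcription by the forced decoder prompt.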
@@ -204,7 +211,7 @@ def save_to_pdf(text, summary):

 banner_html = """
 <div style="text-align: center;">
-<img src="https://huggingface.co/spaces/camparchimedes/transcription_app/blob/main/Olas%20AudioSwitch%20Shop.png" alt="Banner" width="100%" height="auto">
+<img src="https://huggingface.co/spaces/camparchimedes/transcription_app/blob/main/Olas%20AudioSwitch%20Shop.png" width="100%" height="auto">
 </div>
 """
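One detail worth flagging in the banner hunk: the img src still points at the repository's blob/main path, which serves the Hugging Face file-viewer page rather than the raw PNG, so most browsers will not render it as an image. If the banner is meant to embed directly, the resolve/main form of the same URL is the usual choice; a possible variant, not part of this commit:

banner_html = """
<div style="text-align: center;">
    <img src="https://huggingface.co/spaces/camparchimedes/transcription_app/resolve/main/Olas%20AudioSwitch%20Shop.png" width="100%" height="auto">
</div>
"""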