asr-inference

Running on Zero

App Files Community

federicocosta1989 committed 4 days ago

Commit

10107b2

verified ·

1 Parent(s): 705a23b

Update whisper_cs_dev.py

Browse files

Deleted the fake model hack

Files changed (1) hide show

whisper_cs_dev.py +5 -20

whisper_cs_dev.py CHANGED Viewed

@@ -11,7 +11,7 @@ from pathlib import Path
 import glob
 import ctypes
-from settings import DEBUG_MODE, MODEL_PATH_V2_FAST, MODEL_PATH_V2, LEFT_CHANNEL_TEMP_PATH, RIGHT_CHANNEL_TEMP_PATH, FAKE_AUDIO_PATH, RESAMPLING_FREQ
 def load_cudnn():
@@ -93,15 +93,9 @@ def load_model(use_v2_fast, device, compute_type):
             device = device,
         )
-    # HACK we need to do this for strange reasons.
-    # If we don't do this, we get:
-    #Could not load library libcudnn_ops_infer.so.8. Error: libcudnn_ops_infer.so.8: cannot open shared object file: No such file or directory
-    #fake_model = whisper_ts.load_model(MODEL_PATH_V2, device=device)
-    fake_model = None
     if DEBUG_MODE: print(f"Exiting load_model function...")
-    return model, fake_model
 def split_input_stereo_channels(audio_path):
@@ -202,19 +196,10 @@ def transcribe_audio_no_fast_model(model, audio_path):
     if DEBUG_MODE: print(f"Exited transcribe_audio_no_fast_model function.")
-def transcribe_channels(left_waveform, right_waveform, model, use_v2_fast, fake_model):
     if DEBUG_MODE: print(f"Entering transcribe_channels function...")
-    # HACK we need to do this for strange reasons.
-    # If we don't do this, we get:
-    #Could not load library libcudnn_ops_infer.so.8. Error: libcudnn_ops_infer.so.8: cannot open shared object file: No such file or directory
-    #fake_result = whisper_ts.transcribe(
-    #    fake_model,
-    #    FAKE_AUDIO_PATH,
-    #    beam_size=1,
-    #)
     if DEBUG_MODE: print(f"Preparing to transcribe...")
     if use_v2_fast:
@@ -354,10 +339,10 @@ def generate(audio_path, use_v2_fast):
     load_cudnn()
     device, compute_type = get_settings()
-    model, fake_model = load_model(use_v2_fast, device, compute_type)
     split_input_stereo_channels(audio_path)
     left_waveform, right_waveform = process_waveforms()
-    left_result, right_result = transcribe_channels(left_waveform, right_waveform, model, use_v2_fast, fake_model)
     output = post_process_transcripts(left_result, right_result, use_v2_fast)
     cleanup_temp_files(LEFT_CHANNEL_TEMP_PATH, RIGHT_CHANNEL_TEMP_PATH)

 import glob
 import ctypes
+from settings import DEBUG_MODE, MODEL_PATH_V2_FAST, MODEL_PATH_V2, LEFT_CHANNEL_TEMP_PATH, RIGHT_CHANNEL_TEMP_PATH, RESAMPLING_FREQ
 def load_cudnn():
             device = device,
         )
     if DEBUG_MODE: print(f"Exiting load_model function...")
+    return model
 def split_input_stereo_channels(audio_path):
     if DEBUG_MODE: print(f"Exited transcribe_audio_no_fast_model function.")
+def transcribe_channels(left_waveform, right_waveform, model, use_v2_fast):
     if DEBUG_MODE: print(f"Entering transcribe_channels function...")
     if DEBUG_MODE: print(f"Preparing to transcribe...")
     if use_v2_fast:
     load_cudnn()
     device, compute_type = get_settings()
+    model = load_model(use_v2_fast, device, compute_type)
     split_input_stereo_channels(audio_path)
     left_waveform, right_waveform = process_waveforms()
+    left_result, right_result = transcribe_channels(left_waveform, right_waveform, model, use_v2_fast)
     output = post_process_transcripts(left_result, right_result, use_v2_fast)
     cleanup_temp_files(LEFT_CHANNEL_TEMP_PATH, RIGHT_CHANNEL_TEMP_PATH)