Specify dtype in librosa.load instead of casting afterwards
Browse files
- whisper_online.py +2 -2
- whisper_online_server.py +3 -2
whisper_online.py
CHANGED
|
@@ -10,8 +10,8 @@ import math
|
|
| 10 |
|
| 11 |
@lru_cache
|
| 12 |
def load_audio(fname):
|
| 13 |
-
a, _ = librosa.load(fname, sr=16000)
|
| 14 |
-
return a.astype(np.float32)
|
| 15 |
|
| 16 |
def load_audio_chunk(fname, beg, end):
|
| 17 |
audio = load_audio(fname)
|
|
|
|
| 10 |
|
| 11 |
@lru_cache
|
| 12 |
def load_audio(fname):
|
| 13 |
+
a, _ = librosa.load(fname, sr=16000, dtype=np.float32)
|
| 14 |
+
return a
|
| 15 |
|
| 16 |
def load_audio_chunk(fname, beg, end):
|
| 17 |
audio = load_audio(fname)
|
whisper_online_server.py
CHANGED
|
@@ -4,6 +4,7 @@ from whisper_online import *
|
|
| 4 |
import sys
|
| 5 |
import argparse
|
| 6 |
import os
|
|
|
|
| 7 |
parser = argparse.ArgumentParser()
|
| 8 |
|
| 9 |
# server options
|
|
@@ -137,8 +138,8 @@ class ServerProcessor:
|
|
| 137 |
if not raw_bytes:
|
| 138 |
break
|
| 139 |
sf = soundfile.SoundFile(io.BytesIO(raw_bytes), channels=1,endian="LITTLE",samplerate=SAMPLING_RATE, subtype="PCM_16",format="RAW")
|
| 140 |
-
audio, _ = librosa.load(sf,sr=SAMPLING_RATE)
|
| 141 |
-
out.append(audio.astype(np.float32))
|
| 142 |
if not out:
|
| 143 |
return None
|
| 144 |
return np.concatenate(out)
|
|
|
|
| 4 |
import sys
|
| 5 |
import argparse
|
| 6 |
import os
|
| 7 |
+
import numpy as np
|
| 8 |
parser = argparse.ArgumentParser()
|
| 9 |
|
| 10 |
# server options
|
|
|
|
| 138 |
if not raw_bytes:
|
| 139 |
break
|
| 140 |
sf = soundfile.SoundFile(io.BytesIO(raw_bytes), channels=1,endian="LITTLE",samplerate=SAMPLING_RATE, subtype="PCM_16",format="RAW")
|
| 141 |
+
audio, _ = librosa.load(sf,sr=SAMPLING_RATE,dtype=np.float32)
|
| 142 |
+
out.append(audio)
|
| 143 |
if not out:
|
| 144 |
return None
|
| 145 |
return np.concatenate(out)
|